[ { "page_no": 0, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.3, "r_y0": 119.93, "r_x1": 498.93, "r_y1": 119.93, "r_x2": 498.93, "r_y2": 107.03, "r_x3": 96.3, "r_y3": 107.03, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.48, "r_y0": 157.37, "r_x1": 452.75, "r_y1": 157.37, "r_x2": 452.75, "r_y2": 146.69, "r_x3": 142.48, "r_y3": 146.69, "coord_origin": "TOPLEFT" }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.92, "r_y0": 171.32, "r_x1": 332.31, "r_y1": 171.32, "r_x2": 332.31, "r_y2": 160.63, "r_x3": 262.92, "r_y3": 160.63, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.12, "r_y0": 184.43, "r_x1": 212.73, "r_y1": 184.43, "r_x2": 212.73, "r_y2": 175.96, "r_x3": 208.12, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.0, "r_x1": 293.43, "r_y1": 184.0, "r_x2": 293.43, "r_y2": 177.08, "r_x3": 212.73, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.43, "r_y0": 184.43, "r_x1": 298.04, "r_y1": 184.43, "r_x2": 298.04, "r_y2": 175.96, "r_x3": 293.43, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03, "r_y0": 184.0, "r_x1": 378.73, "r_y1": 184.0, "r_x2": 378.73, "r_y2": 177.08, "r_x3": 298.03, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99, "r_y0": 226.23, "r_x1": 190.48, "r_y1": 226.23, "r_x2": 190.48, "r_y2": 215.48, "r_x3": 145.99, "r_y3": 215.48, "coord_origin": "TOPLEFT" }, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 249.98, "r_x1": 286.36, "r_y1": 249.98, "r_x2": 286.36, "r_y2": 241.4, "r_x3": 62.07, "r_y3": 241.4, "coord_origin": "TOPLEFT" }, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 261.94, "r_x1": 286.37, "r_y1": 261.94, "r_x2": 286.37, "r_y2": 253.35, "r_x3": 50.11, "r_y3": 253.35, "coord_origin": "TOPLEFT" }, "text": "pact representation. This content is extremely valuable for", "orig": "pact representation. This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 273.89, "r_x1": 286.37, "r_y1": 273.89, "r_x2": 286.37, "r_y2": 265.31, "r_x3": 50.11, "r_y3": 265.31, "coord_origin": "TOPLEFT" }, "text": "systems such as search engines, Knowledge Graph\u2019s, etc,", "orig": "systems such as search engines, Knowledge Graph\u2019s, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 285.85, "r_x1": 286.37, "r_y1": 285.85, "r_x2": 286.37, "r_y2": 277.26, "r_x3": 50.11, "r_y3": 277.26, "coord_origin": "TOPLEFT" }, "text": "since they enhance their predictive capabilities. Unfortu-", "orig": "since they enhance their predictive capabilities. Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 297.8, "r_x1": 286.37, "r_y1": 297.8, "r_x2": 286.37, "r_y2": 289.22, "r_x3": 50.11, "r_y3": 289.22, "coord_origin": "TOPLEFT" }, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 309.76, "r_x1": 286.37, "r_y1": 309.76, "r_x2": 286.37, "r_y2": 301.17, "r_x3": 50.11, "r_y3": 301.17, "coord_origin": "TOPLEFT" }, "text": "Furthermore, they can have complex column/row-header", "orig": "Furthermore, they can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 321.71, "r_x1": 286.37, "r_y1": 321.71, "r_x2": 286.37, "r_y2": 313.13, "r_x3": 50.11, "r_y3": 313.13, "coord_origin": "TOPLEFT" }, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 333.67, "r_x1": 286.37, "r_y1": 333.67, "r_x2": 286.37, "r_y2": 325.08, "r_x3": 50.11, "r_y3": 325.08, "coord_origin": "TOPLEFT" }, "text": "tion lines, missing entries, etc. As such, the correct iden-", "orig": "tion lines, missing entries, etc. As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 345.62, "r_x1": 286.37, "r_y1": 345.62, "r_x2": 286.37, "r_y2": 337.04, "r_x3": 50.11, "r_y3": 337.04, "coord_origin": "TOPLEFT" }, "text": "tification of the table-structure from an image is a non-", "orig": "tification of the table-structure from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 357.58, "r_x1": 286.37, "r_y1": 357.58, "r_x2": 286.37, "r_y2": 348.99, "r_x3": 50.11, "r_y3": 348.99, "coord_origin": "TOPLEFT" }, "text": "trivial task. In this paper, we present a new table-structure", "orig": "trivial task. In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 369.53, "r_x1": 286.37, "r_y1": 369.53, "r_x2": 286.37, "r_y2": 360.95, "r_x3": 50.11, "r_y3": 360.95, "coord_origin": "TOPLEFT" }, "text": "identification model. The latter improves the latest end-to-", "orig": "identification model. The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 381.49, "r_x1": 286.37, "r_y1": 381.49, "r_x2": 286.37, "r_y2": 372.9, "r_x3": 50.11, "r_y3": 372.9, "coord_origin": "TOPLEFT" }, "text": "end deep learning model (i.e. encoder-dual-decoder from", "orig": "end deep learning model (i.e. encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 393.44, "r_x1": 286.37, "r_y1": 393.44, "r_x2": 286.37, "r_y2": 384.86, "r_x3": 50.11, "r_y3": 384.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet) in two significant ways. First, we introduce a", "orig": "PubTabNet) in two significant ways. First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 405.4, "r_x1": 286.37, "r_y1": 405.4, "r_x2": 286.37, "r_y2": 396.81, "r_x3": 50.11, "r_y3": 396.81, "coord_origin": "TOPLEFT" }, "text": "new object detection decoder for table-cells. In this way,", "orig": "new object detection decoder for table-cells. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 417.35, "r_x1": 286.37, "r_y1": 417.35, "r_x2": 286.37, "r_y2": 408.77, "r_x3": 50.11, "r_y3": 408.77, "coord_origin": "TOPLEFT" }, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 429.31, "r_x1": 286.37, "r_y1": 429.31, "r_x2": 286.37, "r_y2": 420.72, "r_x3": 50.11, "r_y3": 420.72, "coord_origin": "TOPLEFT" }, "text": "matic PDF\u2019s directly from the PDF source and avoid the", "orig": "matic PDF\u2019s directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 441.27, "r_x1": 207.23, "r_y1": 441.27, "r_x2": 207.23, "r_y2": 432.68, "r_x3": 50.11, "r_y3": 432.68, "coord_origin": "TOPLEFT" }, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.1, "r_y0": 441.27, "r_x1": 286.37, "r_y1": 441.27, "r_x2": 286.37, "r_y2": 432.68, "r_x3": 214.1, "r_y3": 432.68, "coord_origin": "TOPLEFT" }, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 453.22, "r_x1": 286.37, "r_y1": 453.22, "r_x2": 286.37, "r_y2": 444.63, "r_x3": 50.11, "r_y3": 444.63, "coord_origin": "TOPLEFT" }, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 465.18, "r_x1": 286.37, "r_y1": 465.18, "r_x2": 286.37, "r_y2": 456.59, "r_x3": 50.11, "r_y3": 456.59, "coord_origin": "TOPLEFT" }, "text": "allows us to tackle non-english tables. Second, we replace", "orig": "allows us to tackle non-english tables. Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 477.13, "r_x1": 286.37, "r_y1": 477.13, "r_x2": 286.37, "r_y2": 468.54, "r_x3": 50.11, "r_y3": 468.54, "coord_origin": "TOPLEFT" }, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 489.09, "r_x1": 286.37, "r_y1": 489.09, "r_x2": 286.37, "r_y2": 480.5, "r_x3": 50.11, "r_y3": 480.5, "coord_origin": "TOPLEFT" }, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 501.04, "r_x1": 286.37, "r_y1": 501.04, "r_x2": 286.37, "r_y2": 492.45, "r_x3": 50.11, "r_y3": 492.45, "coord_origin": "TOPLEFT" }, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 513.0, "r_x1": 276.65, "r_y1": 513.0, "r_x2": 276.65, "r_y2": 504.41, "r_x3": 50.11, "r_y3": 504.41, "coord_origin": "TOPLEFT" }, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 550.69, "r_x1": 58.12, "r_y1": 550.69, "r_x2": 58.12, "r_y2": 539.94, "r_x3": 50.11, "r_y3": 539.94, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.8, "r_y0": 550.69, "r_x1": 126.95, "r_y1": 550.69, "r_x2": 126.95, "r_y2": 539.94, "r_x3": 68.8, "r_y3": 539.94, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 569.69, "r_x1": 286.36, "r_y1": 569.69, "r_x2": 286.36, "r_y2": 560.78, "r_x3": 62.07, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "The occurrence of tables in documents is ubiquitous.", "orig": "The occurrence of tables in documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 581.64, "r_x1": 286.37, "r_y1": 581.64, "r_x2": 286.37, "r_y2": 572.74, "r_x3": 50.11, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 593.6, "r_x1": 286.37, "r_y1": 593.6, "r_x2": 286.37, "r_y2": 584.69, "r_x3": 50.11, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 605.56, "r_x1": 286.37, "r_y1": 605.56, "r_x2": 286.37, "r_y2": 596.65, "r_x3": 50.11, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "tremely valuable. Unfortunately, this compact representa-", "orig": "tremely valuable. Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 617.51, "r_x1": 286.37, "r_y1": 617.51, "r_x2": 286.37, "r_y2": 608.6, "r_x3": 50.11, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 629.47, "r_x1": 286.37, "r_y1": 629.47, "r_x2": 286.37, "r_y2": 620.56, "r_x3": 50.11, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 641.42, "r_x1": 286.37, "r_y1": 641.42, "r_x2": 286.37, "r_y2": 632.51, "r_x3": 50.11, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 50.11, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "table-entries. Fig. 1 shows a table which presents all these", "orig": "table-entries. Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 76.4, "r_y1": 713.15, "r_x2": 76.4, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 226.75, "r_x1": 324.01, "r_y1": 226.75, "r_x2": 324.01, "r_y2": 218.01, "r_x3": 315.57, "r_y3": 218.01, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.23, "r_y0": 226.75, "r_x1": 408.44, "r_y1": 226.75, "r_x2": 408.44, "r_y2": 218.01, "r_x3": 328.23, "r_y3": 218.01, "coord_origin": "TOPLEFT" }, "text": "Picture of a table:", "orig": "Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 322.44, "r_x1": 325.06, "r_y1": 322.44, "r_x2": 325.06, "r_y2": 313.69, "r_x3": 315.57, "r_y3": 313.69, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.8, "r_y0": 322.44, "r_x1": 486.4, "r_y1": 322.44, "r_x2": 486.4, "r_y2": 313.69, "r_x3": 329.8, "r_y3": 313.69, "coord_origin": "TOPLEFT" }, "text": "Red-annotation of bounding boxes,", "orig": "Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.46, "r_y0": 333.24, "r_x1": 472.47, "r_y1": 333.24, "r_x2": 472.47, "r_y2": 324.49, "r_x3": 326.46, "r_y3": 324.49, "coord_origin": "TOPLEFT" }, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 428.93, "r_x1": 324.81, "r_y1": 428.93, "r_x2": 324.81, "r_y2": 420.18, "r_x3": 315.57, "r_y3": 420.18, "coord_origin": "TOPLEFT" }, "text": "c.", "orig": "c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.43, "r_y0": 428.93, "r_x1": 491.19, "r_y1": 428.93, "r_x2": 491.19, "r_y2": 420.18, "r_x3": 329.43, "r_y3": 420.18, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer:", "orig": "Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.15, "r_y0": 351.61, "r_x1": 412.54, "r_y1": 351.61, "r_x2": 412.54, "r_y2": 342.83, "r_x3": 408.15, "r_y3": 342.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11, "r_y0": 350.36, "r_x1": 360.5, "r_y1": 350.36, "r_x2": 360.5, "r_y2": 341.57, "r_x3": 356.11, "r_y3": 341.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.68, "r_y0": 349.72, "r_x1": 505.07, "r_y1": 349.72, "r_x2": 505.07, "r_y2": 340.94, "r_x3": 500.68, "r_y3": 340.94, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13, "r_y0": 360.53, "r_x1": 360.53, "r_y1": 360.53, "r_x2": 360.53, "r_y2": 351.75, "r_x3": 356.13, "r_y3": 351.75, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.54, "r_y0": 364.66, "r_x1": 406.93, "r_y1": 364.66, "r_x2": 406.93, "r_y2": 355.88, "r_x3": 402.54, "r_y3": 355.88, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58, "r_y0": 361.63, "r_x1": 452.97, "r_y1": 361.63, "r_x2": 452.97, "r_y2": 352.84, "r_x3": 448.58, "r_y3": 352.84, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65, "r_y0": 362.49, "r_x1": 496.04, "r_y1": 362.49, "r_x2": 496.04, "r_y2": 353.71, "r_x3": 491.65, "r_y3": 353.71, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.14, "r_y0": 362.12, "r_x1": 539.53, "r_y1": 362.12, "r_x2": 539.53, "r_y2": 353.34, "r_x3": 535.14, "r_y3": 353.34, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.83, "r_y0": 395.88, "r_x1": 353.22, "r_y1": 395.88, "r_x2": 353.22, "r_y2": 387.1, "r_x3": 348.83, "r_y3": 387.1, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27, "r_y0": 384.16, "r_x1": 393.66, "r_y1": 384.16, "r_x2": 393.66, "r_y2": 375.37, "r_x3": 389.27, "r_y3": 375.37, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67, "r_y0": 384.43, "r_x1": 451.46, "r_y1": 384.43, "r_x2": 451.46, "r_y2": 375.65, "r_x3": 442.67, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.44, "r_y0": 384.32, "r_x1": 485.9, "r_y1": 384.32, "r_x2": 485.9, "r_y2": 375.53, "r_x3": 477.44, "r_y3": 375.53, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57, "r_y0": 384.43, "r_x1": 531.36, "r_y1": 384.43, "r_x2": 531.36, "r_y2": 375.65, "r_x3": 522.57, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.23, "r_y0": 395.9, "r_x1": 409.01, "r_y1": 395.9, "r_x2": 409.01, "r_y2": 387.11, "r_x3": 400.23, "r_y3": 387.11, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 395.77, "r_x1": 451.09, "r_y1": 395.77, "r_x2": 451.09, "r_y2": 386.99, "r_x3": 442.31, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.22, "r_y0": 396.16, "r_x1": 487.0, "r_y1": 396.16, "r_x2": 487.0, "r_y2": 387.37, "r_x3": 478.22, "r_y3": 387.37, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.23, "r_y0": 395.77, "r_x1": 532.01, "r_y1": 395.77, "r_x2": 532.01, "r_y2": 386.99, "r_x3": 523.23, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57, "r_y0": 408.21, "r_x1": 415.96, "r_y1": 408.21, "r_x2": 415.96, "r_y2": 399.42, "r_x3": 411.57, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96, "r_y0": 408.21, "r_x1": 420.36, "r_y1": 408.21, "r_x2": 420.36, "r_y2": 399.42, "r_x3": 415.96, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 407.82, "r_x1": 451.09, "r_y1": 407.82, "r_x2": 451.09, "r_y2": 399.04, "r_x3": 442.31, "r_y3": 399.04, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.78, "r_y0": 407.78, "r_x1": 487.56, "r_y1": 407.78, "r_x2": 487.56, "r_y2": 399.0, "r_x3": 478.78, "r_y3": 399.0, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97, "r_y0": 407.4, "r_x1": 532.76, "r_y1": 407.4, "r_x2": 532.76, "r_y2": 398.61, "r_x3": 523.97, "r_y3": 398.61, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09, "r_y0": 367.89, "r_x1": 391.1, "r_y1": 367.89, "r_x2": 391.1, "r_y2": 357.76, "r_x3": 385.09, "r_y3": 357.76, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 390.86, "r_x1": 339.44, "r_y1": 390.86, "r_x2": 339.44, "r_y2": 380.73, "r_x3": 333.43, "r_y3": 380.73, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07, "r_y0": 351.17, "r_x1": 484.08, "r_y1": 351.17, "r_x2": 484.08, "r_y2": 341.04, "r_x3": 478.07, "r_y3": 341.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 523.41, "r_x1": 345.73, "r_y1": 523.41, "r_x2": 345.73, "r_y2": 514.5, "r_x3": 308.86, "r_y3": 514.5, "coord_origin": "TOPLEFT" }, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18, "r_y0": 523.41, "r_x1": 545.12, "r_y1": 523.41, "r_x2": 545.12, "r_y2": 514.5, "r_x3": 353.18, "r_y3": 514.5, "coord_origin": "TOPLEFT" }, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 535.36, "r_x1": 545.12, "r_y1": 535.36, "r_x2": 545.12, "r_y2": 526.46, "r_x3": 308.86, "r_y3": 526.46, "coord_origin": "TOPLEFT" }, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 547.32, "r_x1": 545.12, "r_y1": 547.32, "r_x2": 545.12, "r_y2": 538.41, "r_x3": 308.86, "r_y3": 538.41, "coord_origin": "TOPLEFT" }, "text": "text and (3) cells with no content. Image from PubTabNet", "orig": "text and (3) cells with no content. Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 559.27, "r_x1": 505.69, "r_y1": 559.27, "r_x2": 505.69, "r_y2": 550.37, "r_x3": 308.86, "r_y3": 550.37, "coord_origin": "TOPLEFT" }, "text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 593.32, "r_x1": 545.11, "r_y1": 593.32, "r_x2": 545.11, "r_y2": 584.41, "r_x3": 320.82, "r_y3": 584.41, "coord_origin": "TOPLEFT" }, "text": "Recently, significant progress has been made with vi-", "orig": "Recently, significant progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.27, "r_x1": 545.12, "r_y1": 605.27, "r_x2": 545.12, "r_y2": 596.36, "r_x3": 308.86, "r_y3": 596.36, "coord_origin": "TOPLEFT" }, "text": "sion based approaches to extract tables in documents. For", "orig": "sion based approaches to extract tables in documents. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.23, "r_x1": 545.12, "r_y1": 617.23, "r_x2": 545.12, "r_y2": 608.32, "r_x3": 308.86, "r_y3": 608.32, "coord_origin": "TOPLEFT" }, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.18, "r_x1": 545.12, "r_y1": 629.18, "r_x2": 545.12, "r_y2": 620.27, "r_x3": 308.86, "r_y3": 620.27, "coord_origin": "TOPLEFT" }, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.14, "r_x1": 353.69, "r_y1": 641.14, "r_x2": 353.69, "r_y2": 632.23, "r_x3": 308.86, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "lenges, i.e.", "orig": "lenges, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.11, "r_y0": 641.14, "r_x1": 374.67, "r_y1": 641.14, "r_x2": 374.67, "r_y2": 632.23, "r_x3": 362.11, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.36, "r_y0": 641.14, "r_x1": 545.12, "r_y1": 641.14, "r_x2": 545.12, "r_y2": 632.23, "r_x3": 377.36, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "finding the location of the table(s) on a", "orig": "finding the location of the table(s) on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.09, "r_x1": 545.12, "r_y1": 653.09, "r_x2": 545.12, "r_y2": 644.19, "r_x3": 308.86, "r_y3": 644.19, "coord_origin": "TOPLEFT" }, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.05, "r_x1": 375.55, "r_y1": 665.05, "r_x2": 375.55, "r_y2": 656.14, "r_x3": 308.86, "r_y3": 656.14, "coord_origin": "TOPLEFT" }, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 320.82, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "of-the-art object-detection networks (e.g. YOLO and later", "orig": "of-the-art object-detection networks (e.g. YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.11, "r_y1": 713.15, "r_x2": 545.11, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "on Mask-RCNN [9]). For all practical purposes, it can be", "orig": "on Mask-RCNN [9]). For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 560.0, "r_x2": 36.34, "r_y2": 207.82, "r_x3": 18.34, "r_y3": 207.82, "coord_origin": "TOPLEFT" }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 8, "label": "section_header", "bbox": { "l": 96.3, "t": 107.03, "r": 498.93, "b": 119.93, "coord_origin": "TOPLEFT" }, "confidence": 0.887, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.3, "r_y0": 119.93, "r_x1": 498.93, "r_y1": 119.93, "r_x2": 498.93, "r_y2": 107.03, "r_x3": 96.3, "r_y3": 107.03, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "section_header", "bbox": { "l": 142.48, "t": 146.69, "r": 452.75, "b": 171.32, "coord_origin": "TOPLEFT" }, "confidence": 0.759, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.48, "r_y0": 157.37, "r_x1": 452.75, "r_y1": 157.37, "r_x2": 452.75, "r_y2": 146.69, "r_x3": 142.48, "r_y3": 146.69, "coord_origin": "TOPLEFT" }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.92, "r_y0": 171.32, "r_x1": 332.31, "r_y1": 171.32, "r_x2": 332.31, "r_y2": 160.63, "r_x3": 262.92, "r_y3": 160.63, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "key_value_region", "bbox": { "l": 208.12, "t": 175.96, "r": 378.73, "b": 184.43, "coord_origin": "TOPLEFT" }, "confidence": 0.485, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.12, "r_y0": 184.43, "r_x1": 212.73, "r_y1": 184.43, "r_x2": 212.73, "r_y2": 175.96, "r_x3": 208.12, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.0, "r_x1": 293.43, "r_y1": 184.0, "r_x2": 293.43, "r_y2": 177.08, "r_x3": 212.73, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.43, "r_y0": 184.43, "r_x1": 298.04, "r_y1": 184.43, "r_x2": 298.04, "r_y2": 175.96, "r_x3": 293.43, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03, "r_y0": 184.0, "r_x1": 378.73, "r_y1": 184.0, "r_x2": 378.73, "r_y2": 177.08, "r_x3": 298.03, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 208.12, "t": 175.96, "r": 378.73, "b": 184.43, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.12, "r_y0": 184.43, "r_x1": 212.73, "r_y1": 184.43, "r_x2": 212.73, "r_y2": 175.96, "r_x3": 208.12, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.0, "r_x1": 293.43, "r_y1": 184.0, "r_x2": 293.43, "r_y2": 177.08, "r_x3": 212.73, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.43, "r_y0": 184.43, "r_x1": 298.04, "r_y1": 184.43, "r_x2": 298.04, "r_y2": 175.96, "r_x3": 293.43, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03, "r_y0": 184.0, "r_x1": 378.73, "r_y1": 184.0, "r_x2": 378.73, "r_y2": 177.08, "r_x3": 298.03, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 5, "label": "section_header", "bbox": { "l": 145.99, "t": 215.48, "r": 190.48, "b": 226.23, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99, "r_y0": 226.23, "r_x1": 190.48, "r_y1": 226.23, "r_x2": 190.48, "r_y2": 215.48, "r_x3": 145.99, "r_y3": 215.48, "coord_origin": "TOPLEFT" }, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 241.4, "r": 286.37, "b": 513.0, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 249.98, "r_x1": 286.36, "r_y1": 249.98, "r_x2": 286.36, "r_y2": 241.4, "r_x3": 62.07, "r_y3": 241.4, "coord_origin": "TOPLEFT" }, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 261.94, "r_x1": 286.37, "r_y1": 261.94, "r_x2": 286.37, "r_y2": 253.35, "r_x3": 50.11, "r_y3": 253.35, "coord_origin": "TOPLEFT" }, "text": "pact representation. This content is extremely valuable for", "orig": "pact representation. This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 273.89, "r_x1": 286.37, "r_y1": 273.89, "r_x2": 286.37, "r_y2": 265.31, "r_x3": 50.11, "r_y3": 265.31, "coord_origin": "TOPLEFT" }, "text": "systems such as search engines, Knowledge Graph\u2019s, etc,", "orig": "systems such as search engines, Knowledge Graph\u2019s, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 285.85, "r_x1": 286.37, "r_y1": 285.85, "r_x2": 286.37, "r_y2": 277.26, "r_x3": 50.11, "r_y3": 277.26, "coord_origin": "TOPLEFT" }, "text": "since they enhance their predictive capabilities. Unfortu-", "orig": "since they enhance their predictive capabilities. Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 297.8, "r_x1": 286.37, "r_y1": 297.8, "r_x2": 286.37, "r_y2": 289.22, "r_x3": 50.11, "r_y3": 289.22, "coord_origin": "TOPLEFT" }, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 309.76, "r_x1": 286.37, "r_y1": 309.76, "r_x2": 286.37, "r_y2": 301.17, "r_x3": 50.11, "r_y3": 301.17, "coord_origin": "TOPLEFT" }, "text": "Furthermore, they can have complex column/row-header", "orig": "Furthermore, they can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 321.71, "r_x1": 286.37, "r_y1": 321.71, "r_x2": 286.37, "r_y2": 313.13, "r_x3": 50.11, "r_y3": 313.13, "coord_origin": "TOPLEFT" }, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 333.67, "r_x1": 286.37, "r_y1": 333.67, "r_x2": 286.37, "r_y2": 325.08, "r_x3": 50.11, "r_y3": 325.08, "coord_origin": "TOPLEFT" }, "text": "tion lines, missing entries, etc. As such, the correct iden-", "orig": "tion lines, missing entries, etc. As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 345.62, "r_x1": 286.37, "r_y1": 345.62, "r_x2": 286.37, "r_y2": 337.04, "r_x3": 50.11, "r_y3": 337.04, "coord_origin": "TOPLEFT" }, "text": "tification of the table-structure from an image is a non-", "orig": "tification of the table-structure from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 357.58, "r_x1": 286.37, "r_y1": 357.58, "r_x2": 286.37, "r_y2": 348.99, "r_x3": 50.11, "r_y3": 348.99, "coord_origin": "TOPLEFT" }, "text": "trivial task. In this paper, we present a new table-structure", "orig": "trivial task. In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 369.53, "r_x1": 286.37, "r_y1": 369.53, "r_x2": 286.37, "r_y2": 360.95, "r_x3": 50.11, "r_y3": 360.95, "coord_origin": "TOPLEFT" }, "text": "identification model. The latter improves the latest end-to-", "orig": "identification model. The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 381.49, "r_x1": 286.37, "r_y1": 381.49, "r_x2": 286.37, "r_y2": 372.9, "r_x3": 50.11, "r_y3": 372.9, "coord_origin": "TOPLEFT" }, "text": "end deep learning model (i.e. encoder-dual-decoder from", "orig": "end deep learning model (i.e. encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 393.44, "r_x1": 286.37, "r_y1": 393.44, "r_x2": 286.37, "r_y2": 384.86, "r_x3": 50.11, "r_y3": 384.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet) in two significant ways. First, we introduce a", "orig": "PubTabNet) in two significant ways. First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 405.4, "r_x1": 286.37, "r_y1": 405.4, "r_x2": 286.37, "r_y2": 396.81, "r_x3": 50.11, "r_y3": 396.81, "coord_origin": "TOPLEFT" }, "text": "new object detection decoder for table-cells. In this way,", "orig": "new object detection decoder for table-cells. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 417.35, "r_x1": 286.37, "r_y1": 417.35, "r_x2": 286.37, "r_y2": 408.77, "r_x3": 50.11, "r_y3": 408.77, "coord_origin": "TOPLEFT" }, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 429.31, "r_x1": 286.37, "r_y1": 429.31, "r_x2": 286.37, "r_y2": 420.72, "r_x3": 50.11, "r_y3": 420.72, "coord_origin": "TOPLEFT" }, "text": "matic PDF\u2019s directly from the PDF source and avoid the", "orig": "matic PDF\u2019s directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 441.27, "r_x1": 207.23, "r_y1": 441.27, "r_x2": 207.23, "r_y2": 432.68, "r_x3": 50.11, "r_y3": 432.68, "coord_origin": "TOPLEFT" }, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.1, "r_y0": 441.27, "r_x1": 286.37, "r_y1": 441.27, "r_x2": 286.37, "r_y2": 432.68, "r_x3": 214.1, "r_y3": 432.68, "coord_origin": "TOPLEFT" }, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 453.22, "r_x1": 286.37, "r_y1": 453.22, "r_x2": 286.37, "r_y2": 444.63, "r_x3": 50.11, "r_y3": 444.63, "coord_origin": "TOPLEFT" }, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 465.18, "r_x1": 286.37, "r_y1": 465.18, "r_x2": 286.37, "r_y2": 456.59, "r_x3": 50.11, "r_y3": 456.59, "coord_origin": "TOPLEFT" }, "text": "allows us to tackle non-english tables. Second, we replace", "orig": "allows us to tackle non-english tables. Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 477.13, "r_x1": 286.37, "r_y1": 477.13, "r_x2": 286.37, "r_y2": 468.54, "r_x3": 50.11, "r_y3": 468.54, "coord_origin": "TOPLEFT" }, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 489.09, "r_x1": 286.37, "r_y1": 489.09, "r_x2": 286.37, "r_y2": 480.5, "r_x3": 50.11, "r_y3": 480.5, "coord_origin": "TOPLEFT" }, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 501.04, "r_x1": 286.37, "r_y1": 501.04, "r_x2": 286.37, "r_y2": 492.45, "r_x3": 50.11, "r_y3": 492.45, "coord_origin": "TOPLEFT" }, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 513.0, "r_x1": 276.65, "r_y1": 513.0, "r_x2": 276.65, "r_y2": 504.41, "r_x3": 50.11, "r_y3": 504.41, "coord_origin": "TOPLEFT" }, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 50.11, "t": 539.94, "r": 126.95, "b": 550.69, "coord_origin": "TOPLEFT" }, "confidence": 0.932, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 550.69, "r_x1": 58.12, "r_y1": 550.69, "r_x2": 58.12, "r_y2": 539.94, "r_x3": 50.11, "r_y3": 539.94, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.8, "r_y0": 550.69, "r_x1": 126.95, "r_y1": 550.69, "r_x2": 126.95, "r_y2": 539.94, "r_x3": 68.8, "r_y3": 539.94, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 560.78, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 569.69, "r_x1": 286.36, "r_y1": 569.69, "r_x2": 286.36, "r_y2": 560.78, "r_x3": 62.07, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "The occurrence of tables in documents is ubiquitous.", "orig": "The occurrence of tables in documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 581.64, "r_x1": 286.37, "r_y1": 581.64, "r_x2": 286.37, "r_y2": 572.74, "r_x3": 50.11, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 593.6, "r_x1": 286.37, "r_y1": 593.6, "r_x2": 286.37, "r_y2": 584.69, "r_x3": 50.11, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 605.56, "r_x1": 286.37, "r_y1": 605.56, "r_x2": 286.37, "r_y2": 596.65, "r_x3": 50.11, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "tremely valuable. Unfortunately, this compact representa-", "orig": "tremely valuable. Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 617.51, "r_x1": 286.37, "r_y1": 617.51, "r_x2": 286.37, "r_y2": 608.6, "r_x3": 50.11, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 629.47, "r_x1": 286.37, "r_y1": 629.47, "r_x2": 286.37, "r_y2": 620.56, "r_x3": 50.11, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 641.42, "r_x1": 286.37, "r_y1": 641.42, "r_x2": 286.37, "r_y2": 632.51, "r_x3": 50.11, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 50.11, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "table-entries. Fig. 1 shows a table which presents all these", "orig": "table-entries. Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 76.4, "r_y1": 713.15, "r_x2": 76.4, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "section_header", "bbox": { "l": 315.57, "t": 218.01, "r": 408.44, "b": 226.75, "coord_origin": "TOPLEFT" }, "confidence": 0.672, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 226.75, "r_x1": 324.01, "r_y1": 226.75, "r_x2": 324.01, "r_y2": 218.01, "r_x3": 315.57, "r_y3": 218.01, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.23, "r_y0": 226.75, "r_x1": 408.44, "r_y1": 226.75, "r_x2": 408.44, "r_y2": 218.01, "r_x3": 328.23, "r_y3": 218.01, "coord_origin": "TOPLEFT" }, "text": "Picture of a table:", "orig": "Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "list_item", "bbox": { "l": 315.57, "t": 313.69, "r": 486.4, "b": 333.24, "coord_origin": "TOPLEFT" }, "confidence": 0.555, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 322.44, "r_x1": 325.06, "r_y1": 322.44, "r_x2": 325.06, "r_y2": 313.69, "r_x3": 315.57, "r_y3": 313.69, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.8, "r_y0": 322.44, "r_x1": 486.4, "r_y1": 322.44, "r_x2": 486.4, "r_y2": 313.69, "r_x3": 329.8, "r_y3": 313.69, "coord_origin": "TOPLEFT" }, "text": "Red-annotation of bounding boxes,", "orig": "Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.46, "r_y0": 333.24, "r_x1": 472.47, "r_y1": 333.24, "r_x2": 472.47, "r_y2": 324.49, "r_x3": 326.46, "r_y3": 324.49, "coord_origin": "TOPLEFT" }, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 315.57, "t": 420.18, "r": 491.19, "b": 428.93, "coord_origin": "TOPLEFT" }, "confidence": 0.55, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 428.93, "r_x1": 324.81, "r_y1": 428.93, "r_x2": 324.81, "r_y2": 420.18, "r_x3": 315.57, "r_y3": 420.18, "coord_origin": "TOPLEFT" }, "text": "c.", "orig": "c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.43, "r_y0": 428.93, "r_x1": 491.19, "r_y1": 428.93, "r_x2": 491.19, "r_y2": 420.18, "r_x3": 329.43, "r_y3": 420.18, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer:", "orig": "Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "picture", "bbox": { "l": 314.78, "t": 338.07, "r": 539.18, "b": 410.05, "coord_origin": "TOPLEFT" }, "confidence": 0.874, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.15, "r_y0": 351.61, "r_x1": 412.54, "r_y1": 351.61, "r_x2": 412.54, "r_y2": 342.83, "r_x3": 408.15, "r_y3": 342.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11, "r_y0": 350.36, "r_x1": 360.5, "r_y1": 350.36, "r_x2": 360.5, "r_y2": 341.57, "r_x3": 356.11, "r_y3": 341.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.68, "r_y0": 349.72, "r_x1": 505.07, "r_y1": 349.72, "r_x2": 505.07, "r_y2": 340.94, "r_x3": 500.68, "r_y3": 340.94, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13, "r_y0": 360.53, "r_x1": 360.53, "r_y1": 360.53, "r_x2": 360.53, "r_y2": 351.75, "r_x3": 356.13, "r_y3": 351.75, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.54, "r_y0": 364.66, "r_x1": 406.93, "r_y1": 364.66, "r_x2": 406.93, "r_y2": 355.88, "r_x3": 402.54, "r_y3": 355.88, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58, "r_y0": 361.63, "r_x1": 452.97, "r_y1": 361.63, "r_x2": 452.97, "r_y2": 352.84, "r_x3": 448.58, "r_y3": 352.84, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65, "r_y0": 362.49, "r_x1": 496.04, "r_y1": 362.49, "r_x2": 496.04, "r_y2": 353.71, "r_x3": 491.65, "r_y3": 353.71, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.14, "r_y0": 362.12, "r_x1": 539.53, "r_y1": 362.12, "r_x2": 539.53, "r_y2": 353.34, "r_x3": 535.14, "r_y3": 353.34, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.83, "r_y0": 395.88, "r_x1": 353.22, "r_y1": 395.88, "r_x2": 353.22, "r_y2": 387.1, "r_x3": 348.83, "r_y3": 387.1, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27, "r_y0": 384.16, "r_x1": 393.66, "r_y1": 384.16, "r_x2": 393.66, "r_y2": 375.37, "r_x3": 389.27, "r_y3": 375.37, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67, "r_y0": 384.43, "r_x1": 451.46, "r_y1": 384.43, "r_x2": 451.46, "r_y2": 375.65, "r_x3": 442.67, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.44, "r_y0": 384.32, "r_x1": 485.9, "r_y1": 384.32, "r_x2": 485.9, "r_y2": 375.53, "r_x3": 477.44, "r_y3": 375.53, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57, "r_y0": 384.43, "r_x1": 531.36, "r_y1": 384.43, "r_x2": 531.36, "r_y2": 375.65, "r_x3": 522.57, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.23, "r_y0": 395.9, "r_x1": 409.01, "r_y1": 395.9, "r_x2": 409.01, "r_y2": 387.11, "r_x3": 400.23, "r_y3": 387.11, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 395.77, "r_x1": 451.09, "r_y1": 395.77, "r_x2": 451.09, "r_y2": 386.99, "r_x3": 442.31, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.22, "r_y0": 396.16, "r_x1": 487.0, "r_y1": 396.16, "r_x2": 487.0, "r_y2": 387.37, "r_x3": 478.22, "r_y3": 387.37, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.23, "r_y0": 395.77, "r_x1": 532.01, "r_y1": 395.77, "r_x2": 532.01, "r_y2": 386.99, "r_x3": 523.23, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57, "r_y0": 408.21, "r_x1": 415.96, "r_y1": 408.21, "r_x2": 415.96, "r_y2": 399.42, "r_x3": 411.57, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96, "r_y0": 408.21, "r_x1": 420.36, "r_y1": 408.21, "r_x2": 420.36, "r_y2": 399.42, "r_x3": 415.96, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 407.82, "r_x1": 451.09, "r_y1": 407.82, "r_x2": 451.09, "r_y2": 399.04, "r_x3": 442.31, "r_y3": 399.04, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.78, "r_y0": 407.78, "r_x1": 487.56, "r_y1": 407.78, "r_x2": 487.56, "r_y2": 399.0, "r_x3": 478.78, "r_y3": 399.0, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97, "r_y0": 407.4, "r_x1": 532.76, "r_y1": 407.4, "r_x2": 532.76, "r_y2": 398.61, "r_x3": 523.97, "r_y3": 398.61, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09, "r_y0": 367.89, "r_x1": 391.1, "r_y1": 367.89, "r_x2": 391.1, "r_y2": 357.76, "r_x3": 385.09, "r_y3": 357.76, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 390.86, "r_x1": 339.44, "r_y1": 390.86, "r_x2": 339.44, "r_y2": 380.73, "r_x3": 333.43, "r_y3": 380.73, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07, "r_y0": 351.17, "r_x1": 484.08, "r_y1": 351.17, "r_x2": 484.08, "r_y2": 341.04, "r_x3": 478.07, "r_y3": 341.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 40, "label": "text", "bbox": { "l": 408.15, "t": 342.83, "r": 412.54, "b": 351.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.15, "r_y0": 351.61, "r_x1": 412.54, "r_y1": 351.61, "r_x2": 412.54, "r_y2": 342.83, "r_x3": 408.15, "r_y3": 342.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 356.11, "t": 341.57, "r": 360.5, "b": 350.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11, "r_y0": 350.36, "r_x1": 360.5, "r_y1": 350.36, "r_x2": 360.5, "r_y2": 341.57, "r_x3": 356.11, "r_y3": 341.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 500.68, "t": 340.94, "r": 505.07, "b": 349.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.68, "r_y0": 349.72, "r_x1": 505.07, "r_y1": 349.72, "r_x2": 505.07, "r_y2": 340.94, "r_x3": 500.68, "r_y3": 340.94, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 356.13, "t": 351.75, "r": 360.53, "b": 360.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13, "r_y0": 360.53, "r_x1": 360.53, "r_y1": 360.53, "r_x2": 360.53, "r_y2": 351.75, "r_x3": 356.13, "r_y3": 351.75, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 402.54, "t": 355.88, "r": 406.93, "b": 364.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.54, "r_y0": 364.66, "r_x1": 406.93, "r_y1": 364.66, "r_x2": 406.93, "r_y2": 355.88, "r_x3": 402.54, "r_y3": 355.88, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 448.58, "t": 352.84, "r": 452.97, "b": 361.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58, "r_y0": 361.63, "r_x1": 452.97, "r_y1": 361.63, "r_x2": 452.97, "r_y2": 352.84, "r_x3": 448.58, "r_y3": 352.84, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 491.65, "t": 353.71, "r": 496.04, "b": 362.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65, "r_y0": 362.49, "r_x1": 496.04, "r_y1": 362.49, "r_x2": 496.04, "r_y2": 353.71, "r_x3": 491.65, "r_y3": 353.71, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 535.14, "t": 353.34, "r": 539.53, "b": 362.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.14, "r_y0": 362.12, "r_x1": 539.53, "r_y1": 362.12, "r_x2": 539.53, "r_y2": 353.34, "r_x3": 535.14, "r_y3": 353.34, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 348.83, "t": 387.1, "r": 353.22, "b": 395.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.83, "r_y0": 395.88, "r_x1": 353.22, "r_y1": 395.88, "r_x2": 353.22, "r_y2": 387.1, "r_x3": 348.83, "r_y3": 387.1, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 389.27, "t": 375.37, "r": 393.66, "b": 384.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27, "r_y0": 384.16, "r_x1": 393.66, "r_y1": 384.16, "r_x2": 393.66, "r_y2": 375.37, "r_x3": 389.27, "r_y3": 375.37, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 442.67, "t": 375.65, "r": 451.46, "b": 384.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67, "r_y0": 384.43, "r_x1": 451.46, "r_y1": 384.43, "r_x2": 451.46, "r_y2": 375.65, "r_x3": 442.67, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 477.44, "t": 375.53, "r": 485.9, "b": 384.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.44, "r_y0": 384.32, "r_x1": 485.9, "r_y1": 384.32, "r_x2": 485.9, "r_y2": 375.53, "r_x3": 477.44, "r_y3": 375.53, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 522.57, "t": 375.65, "r": 531.36, "b": 384.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57, "r_y0": 384.43, "r_x1": 531.36, "r_y1": 384.43, "r_x2": 531.36, "r_y2": 375.65, "r_x3": 522.57, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 400.23, "t": 387.11, "r": 409.01, "b": 395.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.23, "r_y0": 395.9, "r_x1": 409.01, "r_y1": 395.9, "r_x2": 409.01, "r_y2": 387.11, "r_x3": 400.23, "r_y3": 387.11, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 442.31, "t": 386.99, "r": 451.09, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 395.77, "r_x1": 451.09, "r_y1": 395.77, "r_x2": 451.09, "r_y2": 386.99, "r_x3": 442.31, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 478.22, "t": 387.37, "r": 487.0, "b": 396.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.22, "r_y0": 396.16, "r_x1": 487.0, "r_y1": 396.16, "r_x2": 487.0, "r_y2": 387.37, "r_x3": 478.22, "r_y3": 387.37, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 523.23, "t": 386.99, "r": 532.01, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.23, "r_y0": 395.77, "r_x1": 532.01, "r_y1": 395.77, "r_x2": 532.01, "r_y2": 386.99, "r_x3": 523.23, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 411.57, "t": 399.42, "r": 415.96, "b": 408.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57, "r_y0": 408.21, "r_x1": 415.96, "r_y1": 408.21, "r_x2": 415.96, "r_y2": 399.42, "r_x3": 411.57, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 415.96, "t": 399.42, "r": 420.36, "b": 408.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96, "r_y0": 408.21, "r_x1": 420.36, "r_y1": 408.21, "r_x2": 420.36, "r_y2": 399.42, "r_x3": 415.96, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 442.31, "t": 399.04, "r": 451.09, "b": 407.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 407.82, "r_x1": 451.09, "r_y1": 407.82, "r_x2": 451.09, "r_y2": 399.04, "r_x3": 442.31, "r_y3": 399.04, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 478.78, "t": 399.0, "r": 487.56, "b": 407.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.78, "r_y0": 407.78, "r_x1": 487.56, "r_y1": 407.78, "r_x2": 487.56, "r_y2": 399.0, "r_x3": 478.78, "r_y3": 399.0, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 523.97, "t": 398.61, "r": 532.76, "b": 407.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97, "r_y0": 407.4, "r_x1": 532.76, "r_y1": 407.4, "r_x2": 532.76, "r_y2": 398.61, "r_x3": 523.97, "r_y3": 398.61, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 385.09, "t": 357.76, "r": 391.1, "b": 367.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09, "r_y0": 367.89, "r_x1": 391.1, "r_y1": 367.89, "r_x2": 391.1, "r_y2": 357.76, "r_x3": 385.09, "r_y3": 357.76, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 333.43, "t": 380.73, "r": 339.44, "b": 390.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 390.86, "r_x1": 339.44, "r_y1": 390.86, "r_x2": 339.44, "r_y2": 380.73, "r_x3": 333.43, "r_y3": 380.73, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 478.07, "t": 341.04, "r": 484.08, "b": 351.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07, "r_y0": 351.17, "r_x1": 484.08, "r_y1": 351.17, "r_x2": 484.08, "r_y2": 341.04, "r_x3": 478.07, "r_y3": 341.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 23, "label": "picture", "bbox": { "l": 315.72, "t": 433.82, "r": 536.84, "b": 496.03, "coord_origin": "TOPLEFT" }, "confidence": 0.509, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.1, "t": 437.69, "r": 398.5, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.25, "t": 449.55, "r": 351.64, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.7, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.9, "t": 473.32, "r": 337.91, "b": 483.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.88, "t": 437.59, "r": 465.88, "b": 447.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 11, "label": "table", "bbox": { "l": 315.72, "t": 433.82, "r": 536.84, "b": 496.03, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.1, "t": 437.69, "r": 398.5, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.25, "t": 449.55, "r": 351.64, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.7, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.9, "t": 473.32, "r": 337.91, "b": 483.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.88, "t": 437.59, "r": 465.88, "b": 447.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 16, "label": "picture", "bbox": { "l": 315.65, "t": 228.72, "r": 537.15, "b": 302.8, "coord_origin": "TOPLEFT" }, "confidence": 0.609, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.2, "t": 269.35, "r": 337.2, "b": 279.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.03, "t": 252.68, "r": 390.04, "b": 262.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 15, "label": "table", "bbox": { "l": 315.65, "t": 228.72, "r": 537.15, "b": 302.8, "coord_origin": "TOPLEFT" }, "confidence": 0.652, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.2, "t": 269.35, "r": 337.2, "b": 279.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.03, "t": 252.68, "r": 390.04, "b": 262.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 6, "label": "caption", "bbox": { "l": 308.86, "t": 514.5, "r": 545.12, "b": 559.27, "coord_origin": "TOPLEFT" }, "confidence": 0.921, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 523.41, "r_x1": 345.73, "r_y1": 523.41, "r_x2": 345.73, "r_y2": 514.5, "r_x3": 308.86, "r_y3": 514.5, "coord_origin": "TOPLEFT" }, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18, "r_y0": 523.41, "r_x1": 545.12, "r_y1": 523.41, "r_x2": 545.12, "r_y2": 514.5, "r_x3": 353.18, "r_y3": 514.5, "coord_origin": "TOPLEFT" }, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 535.36, "r_x1": 545.12, "r_y1": 535.36, "r_x2": 545.12, "r_y2": 526.46, "r_x3": 308.86, "r_y3": 526.46, "coord_origin": "TOPLEFT" }, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 547.32, "r_x1": 545.12, "r_y1": 547.32, "r_x2": 545.12, "r_y2": 538.41, "r_x3": 308.86, "r_y3": 538.41, "coord_origin": "TOPLEFT" }, "text": "text and (3) cells with no content. Image from PubTabNet", "orig": "text and (3) cells with no content. Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 559.27, "r_x1": 505.69, "r_y1": 559.27, "r_x2": 505.69, "r_y2": 550.37, "r_x3": 308.86, "r_y3": 550.37, "coord_origin": "TOPLEFT" }, "text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 584.41, "r": 545.12, "b": 665.05, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 593.32, "r_x1": 545.11, "r_y1": 593.32, "r_x2": 545.11, "r_y2": 584.41, "r_x3": 320.82, "r_y3": 584.41, "coord_origin": "TOPLEFT" }, "text": "Recently, significant progress has been made with vi-", "orig": "Recently, significant progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.27, "r_x1": 545.12, "r_y1": 605.27, "r_x2": 545.12, "r_y2": 596.36, "r_x3": 308.86, "r_y3": 596.36, "coord_origin": "TOPLEFT" }, "text": "sion based approaches to extract tables in documents. For", "orig": "sion based approaches to extract tables in documents. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.23, "r_x1": 545.12, "r_y1": 617.23, "r_x2": 545.12, "r_y2": 608.32, "r_x3": 308.86, "r_y3": 608.32, "coord_origin": "TOPLEFT" }, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.18, "r_x1": 545.12, "r_y1": 629.18, "r_x2": 545.12, "r_y2": 620.27, "r_x3": 308.86, "r_y3": 620.27, "coord_origin": "TOPLEFT" }, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.14, "r_x1": 353.69, "r_y1": 641.14, "r_x2": 353.69, "r_y2": 632.23, "r_x3": 308.86, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "lenges, i.e.", "orig": "lenges, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.11, "r_y0": 641.14, "r_x1": 374.67, "r_y1": 641.14, "r_x2": 374.67, "r_y2": 632.23, "r_x3": 362.11, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.36, "r_y0": 641.14, "r_x1": 545.12, "r_y1": 641.14, "r_x2": 545.12, "r_y2": 632.23, "r_x3": 377.36, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "finding the location of the table(s) on a", "orig": "finding the location of the table(s) on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.09, "r_x1": 545.12, "r_y1": 653.09, "r_x2": 545.12, "r_y2": 644.19, "r_x3": 308.86, "r_y3": 644.19, "coord_origin": "TOPLEFT" }, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.05, "r_x1": 375.55, "r_y1": 665.05, "r_x2": 375.55, "r_y2": 656.14, "r_x3": 308.86, "r_y3": 656.14, "coord_origin": "TOPLEFT" }, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 668.38, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 320.82, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "of-the-art object-detection networks (e.g. YOLO and later", "orig": "of-the-art object-detection networks (e.g. YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.11, "r_y1": 713.15, "r_x2": 545.11, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "on Mask-RCNN [9]). For all practical purposes, it can be", "orig": "on Mask-RCNN [9]). For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.805, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_header", "bbox": { "l": 18.34, "t": 207.82, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 560.0, "r_x2": 36.34, "r_y2": 207.82, "r_x3": 18.34, "r_y3": 207.82, "coord_origin": "TOPLEFT" }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "11": { "label": "table", "id": 11, "page_no": 0, "cluster": { "id": 11, "label": "table", "bbox": { "l": 315.72, "t": 433.82, "r": 536.84, "b": 496.03, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.1, "t": 437.69, "r": 398.5, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.25, "t": 449.55, "r": 351.64, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.7, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.9, "t": 473.32, "r": 337.91, "b": 483.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.88, "t": 437.59, "r": 465.88, "b": 447.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 5, "table_cells": [ { "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false } ] }, "15": { "label": "table", "id": 15, "page_no": 0, "cluster": { "id": 15, "label": "table", "bbox": { "l": 315.65, "t": 228.72, "r": 537.15, "b": 302.8, "coord_origin": "TOPLEFT" }, "confidence": 0.652, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.2, "t": 269.35, "r": 337.2, "b": 279.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.03, "t": 252.68, "r": 390.04, "b": 262.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 1, "num_cols": 1, "table_cells": [ { "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 8, "page_no": 0, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 96.3, "t": 107.03, "r": 498.93, "b": 119.93, "coord_origin": "TOPLEFT" }, "confidence": 0.887, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.3, "r_y0": 119.93, "r_x1": 498.93, "r_y1": 119.93, "r_x2": 498.93, "r_y2": 107.03, "r_x3": 96.3, "r_y3": 107.03, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer: Table Structure Understanding with Transformers." }, { "label": "section_header", "id": 13, "page_no": 0, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 142.48, "t": 146.69, "r": 452.75, "b": 171.32, "coord_origin": "TOPLEFT" }, "confidence": 0.759, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.48, "r_y0": 157.37, "r_x1": 452.75, "r_y1": 157.37, "r_x2": 452.75, "r_y2": 146.69, "r_x3": 142.48, "r_y3": 146.69, "coord_origin": "TOPLEFT" }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.92, "r_y0": 171.32, "r_x1": 332.31, "r_y1": 171.32, "r_x2": 332.31, "r_y2": 160.63, "r_x3": 262.92, "r_y3": 160.63, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research" }, { "label": "key_value_region", "id": 25, "page_no": 0, "cluster": { "id": 25, "label": "key_value_region", "bbox": { "l": 208.12, "t": 175.96, "r": 378.73, "b": 184.43, "coord_origin": "TOPLEFT" }, "confidence": 0.485, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.12, "r_y0": 184.43, "r_x1": 212.73, "r_y1": 184.43, "r_x2": 212.73, "r_y2": 175.96, "r_x3": 208.12, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.0, "r_x1": 293.43, "r_y1": 184.0, "r_x2": 293.43, "r_y2": 177.08, "r_x3": 212.73, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.43, "r_y0": 184.43, "r_x1": 298.04, "r_y1": 184.43, "r_x2": 298.04, "r_y2": 175.96, "r_x3": 293.43, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03, "r_y0": 184.0, "r_x1": 378.73, "r_y1": 184.0, "r_x2": 378.73, "r_y2": 177.08, "r_x3": 298.03, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 208.12, "t": 175.96, "r": 378.73, "b": 184.43, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.12, "r_y0": 184.43, "r_x1": 212.73, "r_y1": 184.43, "r_x2": 212.73, "r_y2": 175.96, "r_x3": 208.12, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.0, "r_x1": 293.43, "r_y1": 184.0, "r_x2": 293.43, "r_y2": 177.08, "r_x3": 212.73, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.43, "r_y0": 184.43, "r_x1": 298.04, "r_y1": 184.43, "r_x2": 298.04, "r_y2": 175.96, "r_x3": 293.43, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03, "r_y0": 184.0, "r_x1": 378.73, "r_y1": 184.0, "r_x2": 378.73, "r_y2": 177.08, "r_x3": 298.03, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 145.99, "t": 215.48, "r": 190.48, "b": 226.23, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99, "r_y0": 226.23, "r_x1": 190.48, "r_y1": 226.23, "r_x2": 190.48, "r_y2": 215.48, "r_x3": 145.99, "r_y3": 215.48, "coord_origin": "TOPLEFT" }, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract" }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 241.4, "r": 286.37, "b": 513.0, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 249.98, "r_x1": 286.36, "r_y1": 249.98, "r_x2": 286.36, "r_y2": 241.4, "r_x3": 62.07, "r_y3": 241.4, "coord_origin": "TOPLEFT" }, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 261.94, "r_x1": 286.37, "r_y1": 261.94, "r_x2": 286.37, "r_y2": 253.35, "r_x3": 50.11, "r_y3": 253.35, "coord_origin": "TOPLEFT" }, "text": "pact representation. This content is extremely valuable for", "orig": "pact representation. This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 273.89, "r_x1": 286.37, "r_y1": 273.89, "r_x2": 286.37, "r_y2": 265.31, "r_x3": 50.11, "r_y3": 265.31, "coord_origin": "TOPLEFT" }, "text": "systems such as search engines, Knowledge Graph\u2019s, etc,", "orig": "systems such as search engines, Knowledge Graph\u2019s, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 285.85, "r_x1": 286.37, "r_y1": 285.85, "r_x2": 286.37, "r_y2": 277.26, "r_x3": 50.11, "r_y3": 277.26, "coord_origin": "TOPLEFT" }, "text": "since they enhance their predictive capabilities. Unfortu-", "orig": "since they enhance their predictive capabilities. Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 297.8, "r_x1": 286.37, "r_y1": 297.8, "r_x2": 286.37, "r_y2": 289.22, "r_x3": 50.11, "r_y3": 289.22, "coord_origin": "TOPLEFT" }, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 309.76, "r_x1": 286.37, "r_y1": 309.76, "r_x2": 286.37, "r_y2": 301.17, "r_x3": 50.11, "r_y3": 301.17, "coord_origin": "TOPLEFT" }, "text": "Furthermore, they can have complex column/row-header", "orig": "Furthermore, they can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 321.71, "r_x1": 286.37, "r_y1": 321.71, "r_x2": 286.37, "r_y2": 313.13, "r_x3": 50.11, "r_y3": 313.13, "coord_origin": "TOPLEFT" }, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 333.67, "r_x1": 286.37, "r_y1": 333.67, "r_x2": 286.37, "r_y2": 325.08, "r_x3": 50.11, "r_y3": 325.08, "coord_origin": "TOPLEFT" }, "text": "tion lines, missing entries, etc. As such, the correct iden-", "orig": "tion lines, missing entries, etc. As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 345.62, "r_x1": 286.37, "r_y1": 345.62, "r_x2": 286.37, "r_y2": 337.04, "r_x3": 50.11, "r_y3": 337.04, "coord_origin": "TOPLEFT" }, "text": "tification of the table-structure from an image is a non-", "orig": "tification of the table-structure from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 357.58, "r_x1": 286.37, "r_y1": 357.58, "r_x2": 286.37, "r_y2": 348.99, "r_x3": 50.11, "r_y3": 348.99, "coord_origin": "TOPLEFT" }, "text": "trivial task. In this paper, we present a new table-structure", "orig": "trivial task. In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 369.53, "r_x1": 286.37, "r_y1": 369.53, "r_x2": 286.37, "r_y2": 360.95, "r_x3": 50.11, "r_y3": 360.95, "coord_origin": "TOPLEFT" }, "text": "identification model. The latter improves the latest end-to-", "orig": "identification model. The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 381.49, "r_x1": 286.37, "r_y1": 381.49, "r_x2": 286.37, "r_y2": 372.9, "r_x3": 50.11, "r_y3": 372.9, "coord_origin": "TOPLEFT" }, "text": "end deep learning model (i.e. encoder-dual-decoder from", "orig": "end deep learning model (i.e. encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 393.44, "r_x1": 286.37, "r_y1": 393.44, "r_x2": 286.37, "r_y2": 384.86, "r_x3": 50.11, "r_y3": 384.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet) in two significant ways. First, we introduce a", "orig": "PubTabNet) in two significant ways. First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 405.4, "r_x1": 286.37, "r_y1": 405.4, "r_x2": 286.37, "r_y2": 396.81, "r_x3": 50.11, "r_y3": 396.81, "coord_origin": "TOPLEFT" }, "text": "new object detection decoder for table-cells. In this way,", "orig": "new object detection decoder for table-cells. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 417.35, "r_x1": 286.37, "r_y1": 417.35, "r_x2": 286.37, "r_y2": 408.77, "r_x3": 50.11, "r_y3": 408.77, "coord_origin": "TOPLEFT" }, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 429.31, "r_x1": 286.37, "r_y1": 429.31, "r_x2": 286.37, "r_y2": 420.72, "r_x3": 50.11, "r_y3": 420.72, "coord_origin": "TOPLEFT" }, "text": "matic PDF\u2019s directly from the PDF source and avoid the", "orig": "matic PDF\u2019s directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 441.27, "r_x1": 207.23, "r_y1": 441.27, "r_x2": 207.23, "r_y2": 432.68, "r_x3": 50.11, "r_y3": 432.68, "coord_origin": "TOPLEFT" }, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.1, "r_y0": 441.27, "r_x1": 286.37, "r_y1": 441.27, "r_x2": 286.37, "r_y2": 432.68, "r_x3": 214.1, "r_y3": 432.68, "coord_origin": "TOPLEFT" }, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 453.22, "r_x1": 286.37, "r_y1": 453.22, "r_x2": 286.37, "r_y2": 444.63, "r_x3": 50.11, "r_y3": 444.63, "coord_origin": "TOPLEFT" }, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 465.18, "r_x1": 286.37, "r_y1": 465.18, "r_x2": 286.37, "r_y2": 456.59, "r_x3": 50.11, "r_y3": 456.59, "coord_origin": "TOPLEFT" }, "text": "allows us to tackle non-english tables. Second, we replace", "orig": "allows us to tackle non-english tables. Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 477.13, "r_x1": 286.37, "r_y1": 477.13, "r_x2": 286.37, "r_y2": 468.54, "r_x3": 50.11, "r_y3": 468.54, "coord_origin": "TOPLEFT" }, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 489.09, "r_x1": 286.37, "r_y1": 489.09, "r_x2": 286.37, "r_y2": 480.5, "r_x3": 50.11, "r_y3": 480.5, "coord_origin": "TOPLEFT" }, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 501.04, "r_x1": 286.37, "r_y1": 501.04, "r_x2": 286.37, "r_y2": 492.45, "r_x3": 50.11, "r_y3": 492.45, "coord_origin": "TOPLEFT" }, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 513.0, "r_x1": 276.65, "r_y1": 513.0, "r_x2": 276.65, "r_y2": 504.41, "r_x3": 50.11, "r_y3": 504.41, "coord_origin": "TOPLEFT" }, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables." }, { "label": "section_header", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 50.11, "t": 539.94, "r": 126.95, "b": 550.69, "coord_origin": "TOPLEFT" }, "confidence": 0.932, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 550.69, "r_x1": 58.12, "r_y1": 550.69, "r_x2": 58.12, "r_y2": 539.94, "r_x3": 50.11, "r_y3": 539.94, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.8, "r_y0": 550.69, "r_x1": 126.95, "r_y1": 550.69, "r_x2": 126.95, "r_y2": 539.94, "r_x3": 68.8, "r_y3": 539.94, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Introduction" }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 560.78, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 569.69, "r_x1": 286.36, "r_y1": 569.69, "r_x2": 286.36, "r_y2": 560.78, "r_x3": 62.07, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "The occurrence of tables in documents is ubiquitous.", "orig": "The occurrence of tables in documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 581.64, "r_x1": 286.37, "r_y1": 581.64, "r_x2": 286.37, "r_y2": 572.74, "r_x3": 50.11, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 593.6, "r_x1": 286.37, "r_y1": 593.6, "r_x2": 286.37, "r_y2": 584.69, "r_x3": 50.11, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 605.56, "r_x1": 286.37, "r_y1": 605.56, "r_x2": 286.37, "r_y2": 596.65, "r_x3": 50.11, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "tremely valuable. Unfortunately, this compact representa-", "orig": "tremely valuable. Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 617.51, "r_x1": 286.37, "r_y1": 617.51, "r_x2": 286.37, "r_y2": 608.6, "r_x3": 50.11, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 629.47, "r_x1": 286.37, "r_y1": 629.47, "r_x2": 286.37, "r_y2": 620.56, "r_x3": 50.11, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 641.42, "r_x1": 286.37, "r_y1": 641.42, "r_x2": 286.37, "r_y2": 632.51, "r_x3": 50.11, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 50.11, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "table-entries. Fig. 1 shows a table which presents all these", "orig": "table-entries. Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 76.4, "r_y1": 713.15, "r_x2": 76.4, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues." }, { "label": "section_header", "id": 14, "page_no": 0, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 315.57, "t": 218.01, "r": 408.44, "b": 226.75, "coord_origin": "TOPLEFT" }, "confidence": 0.672, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 226.75, "r_x1": 324.01, "r_y1": 226.75, "r_x2": 324.01, "r_y2": 218.01, "r_x3": 315.57, "r_y3": 218.01, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.23, "r_y0": 226.75, "r_x1": 408.44, "r_y1": 226.75, "r_x2": 408.44, "r_y2": 218.01, "r_x3": 328.23, "r_y3": 218.01, "coord_origin": "TOPLEFT" }, "text": "Picture of a table:", "orig": "Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "a. Picture of a table:" }, { "label": "list_item", "id": 17, "page_no": 0, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 315.57, "t": 313.69, "r": 486.4, "b": 333.24, "coord_origin": "TOPLEFT" }, "confidence": 0.555, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 322.44, "r_x1": 325.06, "r_y1": 322.44, "r_x2": 325.06, "r_y2": 313.69, "r_x3": 315.57, "r_y3": 313.69, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.8, "r_y0": 322.44, "r_x1": 486.4, "r_y1": 322.44, "r_x2": 486.4, "r_y2": 313.69, "r_x3": 329.8, "r_y3": 313.69, "coord_origin": "TOPLEFT" }, "text": "Red-annotation of bounding boxes,", "orig": "Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.46, "r_y0": 333.24, "r_x1": 472.47, "r_y1": 333.24, "r_x2": 472.47, "r_y2": 324.49, "r_x3": 326.46, "r_y3": 324.49, "coord_origin": "TOPLEFT" }, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer" }, { "label": "list_item", "id": 18, "page_no": 0, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 315.57, "t": 420.18, "r": 491.19, "b": 428.93, "coord_origin": "TOPLEFT" }, "confidence": 0.55, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 428.93, "r_x1": 324.81, "r_y1": 428.93, "r_x2": 324.81, "r_y2": 420.18, "r_x3": 315.57, "r_y3": 420.18, "coord_origin": "TOPLEFT" }, "text": "c.", "orig": "c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.43, "r_y0": 428.93, "r_x1": 491.19, "r_y1": 428.93, "r_x2": 491.19, "r_y2": 420.18, "r_x3": 329.43, "r_y3": 420.18, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer:", "orig": "Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "c. Structure predicted by TableFormer:" }, { "label": "picture", "id": 10, "page_no": 0, "cluster": { "id": 10, "label": "picture", "bbox": { "l": 314.78, "t": 338.07, "r": 539.18, "b": 410.05, "coord_origin": "TOPLEFT" }, "confidence": 0.874, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.15, "r_y0": 351.61, "r_x1": 412.54, "r_y1": 351.61, "r_x2": 412.54, "r_y2": 342.83, "r_x3": 408.15, "r_y3": 342.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11, "r_y0": 350.36, "r_x1": 360.5, "r_y1": 350.36, "r_x2": 360.5, "r_y2": 341.57, "r_x3": 356.11, "r_y3": 341.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.68, "r_y0": 349.72, "r_x1": 505.07, "r_y1": 349.72, "r_x2": 505.07, "r_y2": 340.94, "r_x3": 500.68, "r_y3": 340.94, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13, "r_y0": 360.53, "r_x1": 360.53, "r_y1": 360.53, "r_x2": 360.53, "r_y2": 351.75, "r_x3": 356.13, "r_y3": 351.75, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.54, "r_y0": 364.66, "r_x1": 406.93, "r_y1": 364.66, "r_x2": 406.93, "r_y2": 355.88, "r_x3": 402.54, "r_y3": 355.88, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58, "r_y0": 361.63, "r_x1": 452.97, "r_y1": 361.63, "r_x2": 452.97, "r_y2": 352.84, "r_x3": 448.58, "r_y3": 352.84, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65, "r_y0": 362.49, "r_x1": 496.04, "r_y1": 362.49, "r_x2": 496.04, "r_y2": 353.71, "r_x3": 491.65, "r_y3": 353.71, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.14, "r_y0": 362.12, "r_x1": 539.53, "r_y1": 362.12, "r_x2": 539.53, "r_y2": 353.34, "r_x3": 535.14, "r_y3": 353.34, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.83, "r_y0": 395.88, "r_x1": 353.22, "r_y1": 395.88, "r_x2": 353.22, "r_y2": 387.1, "r_x3": 348.83, "r_y3": 387.1, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27, "r_y0": 384.16, "r_x1": 393.66, "r_y1": 384.16, "r_x2": 393.66, "r_y2": 375.37, "r_x3": 389.27, "r_y3": 375.37, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67, "r_y0": 384.43, "r_x1": 451.46, "r_y1": 384.43, "r_x2": 451.46, "r_y2": 375.65, "r_x3": 442.67, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.44, "r_y0": 384.32, "r_x1": 485.9, "r_y1": 384.32, "r_x2": 485.9, "r_y2": 375.53, "r_x3": 477.44, "r_y3": 375.53, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57, "r_y0": 384.43, "r_x1": 531.36, "r_y1": 384.43, "r_x2": 531.36, "r_y2": 375.65, "r_x3": 522.57, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.23, "r_y0": 395.9, "r_x1": 409.01, "r_y1": 395.9, "r_x2": 409.01, "r_y2": 387.11, "r_x3": 400.23, "r_y3": 387.11, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 395.77, "r_x1": 451.09, "r_y1": 395.77, "r_x2": 451.09, "r_y2": 386.99, "r_x3": 442.31, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.22, "r_y0": 396.16, "r_x1": 487.0, "r_y1": 396.16, "r_x2": 487.0, "r_y2": 387.37, "r_x3": 478.22, "r_y3": 387.37, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.23, "r_y0": 395.77, "r_x1": 532.01, "r_y1": 395.77, "r_x2": 532.01, "r_y2": 386.99, "r_x3": 523.23, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57, "r_y0": 408.21, "r_x1": 415.96, "r_y1": 408.21, "r_x2": 415.96, "r_y2": 399.42, "r_x3": 411.57, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96, "r_y0": 408.21, "r_x1": 420.36, "r_y1": 408.21, "r_x2": 420.36, "r_y2": 399.42, "r_x3": 415.96, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 407.82, "r_x1": 451.09, "r_y1": 407.82, "r_x2": 451.09, "r_y2": 399.04, "r_x3": 442.31, "r_y3": 399.04, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.78, "r_y0": 407.78, "r_x1": 487.56, "r_y1": 407.78, "r_x2": 487.56, "r_y2": 399.0, "r_x3": 478.78, "r_y3": 399.0, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97, "r_y0": 407.4, "r_x1": 532.76, "r_y1": 407.4, "r_x2": 532.76, "r_y2": 398.61, "r_x3": 523.97, "r_y3": 398.61, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09, "r_y0": 367.89, "r_x1": 391.1, "r_y1": 367.89, "r_x2": 391.1, "r_y2": 357.76, "r_x3": 385.09, "r_y3": 357.76, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 390.86, "r_x1": 339.44, "r_y1": 390.86, "r_x2": 339.44, "r_y2": 380.73, "r_x3": 333.43, "r_y3": 380.73, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07, "r_y0": 351.17, "r_x1": 484.08, "r_y1": 351.17, "r_x2": 484.08, "r_y2": 341.04, "r_x3": 478.07, "r_y3": 341.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 40, "label": "text", "bbox": { "l": 408.15, "t": 342.83, "r": 412.54, "b": 351.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.15, "r_y0": 351.61, "r_x1": 412.54, "r_y1": 351.61, "r_x2": 412.54, "r_y2": 342.83, "r_x3": 408.15, "r_y3": 342.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 356.11, "t": 341.57, "r": 360.5, "b": 350.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11, "r_y0": 350.36, "r_x1": 360.5, "r_y1": 350.36, "r_x2": 360.5, "r_y2": 341.57, "r_x3": 356.11, "r_y3": 341.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 500.68, "t": 340.94, "r": 505.07, "b": 349.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.68, "r_y0": 349.72, "r_x1": 505.07, "r_y1": 349.72, "r_x2": 505.07, "r_y2": 340.94, "r_x3": 500.68, "r_y3": 340.94, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 356.13, "t": 351.75, "r": 360.53, "b": 360.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13, "r_y0": 360.53, "r_x1": 360.53, "r_y1": 360.53, "r_x2": 360.53, "r_y2": 351.75, "r_x3": 356.13, "r_y3": 351.75, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 402.54, "t": 355.88, "r": 406.93, "b": 364.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.54, "r_y0": 364.66, "r_x1": 406.93, "r_y1": 364.66, "r_x2": 406.93, "r_y2": 355.88, "r_x3": 402.54, "r_y3": 355.88, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 448.58, "t": 352.84, "r": 452.97, "b": 361.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58, "r_y0": 361.63, "r_x1": 452.97, "r_y1": 361.63, "r_x2": 452.97, "r_y2": 352.84, "r_x3": 448.58, "r_y3": 352.84, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 491.65, "t": 353.71, "r": 496.04, "b": 362.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65, "r_y0": 362.49, "r_x1": 496.04, "r_y1": 362.49, "r_x2": 496.04, "r_y2": 353.71, "r_x3": 491.65, "r_y3": 353.71, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 535.14, "t": 353.34, "r": 539.53, "b": 362.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.14, "r_y0": 362.12, "r_x1": 539.53, "r_y1": 362.12, "r_x2": 539.53, "r_y2": 353.34, "r_x3": 535.14, "r_y3": 353.34, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 348.83, "t": 387.1, "r": 353.22, "b": 395.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.83, "r_y0": 395.88, "r_x1": 353.22, "r_y1": 395.88, "r_x2": 353.22, "r_y2": 387.1, "r_x3": 348.83, "r_y3": 387.1, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 389.27, "t": 375.37, "r": 393.66, "b": 384.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27, "r_y0": 384.16, "r_x1": 393.66, "r_y1": 384.16, "r_x2": 393.66, "r_y2": 375.37, "r_x3": 389.27, "r_y3": 375.37, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 442.67, "t": 375.65, "r": 451.46, "b": 384.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67, "r_y0": 384.43, "r_x1": 451.46, "r_y1": 384.43, "r_x2": 451.46, "r_y2": 375.65, "r_x3": 442.67, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 477.44, "t": 375.53, "r": 485.9, "b": 384.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.44, "r_y0": 384.32, "r_x1": 485.9, "r_y1": 384.32, "r_x2": 485.9, "r_y2": 375.53, "r_x3": 477.44, "r_y3": 375.53, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 522.57, "t": 375.65, "r": 531.36, "b": 384.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57, "r_y0": 384.43, "r_x1": 531.36, "r_y1": 384.43, "r_x2": 531.36, "r_y2": 375.65, "r_x3": 522.57, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 400.23, "t": 387.11, "r": 409.01, "b": 395.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.23, "r_y0": 395.9, "r_x1": 409.01, "r_y1": 395.9, "r_x2": 409.01, "r_y2": 387.11, "r_x3": 400.23, "r_y3": 387.11, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 442.31, "t": 386.99, "r": 451.09, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 395.77, "r_x1": 451.09, "r_y1": 395.77, "r_x2": 451.09, "r_y2": 386.99, "r_x3": 442.31, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 478.22, "t": 387.37, "r": 487.0, "b": 396.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.22, "r_y0": 396.16, "r_x1": 487.0, "r_y1": 396.16, "r_x2": 487.0, "r_y2": 387.37, "r_x3": 478.22, "r_y3": 387.37, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 523.23, "t": 386.99, "r": 532.01, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.23, "r_y0": 395.77, "r_x1": 532.01, "r_y1": 395.77, "r_x2": 532.01, "r_y2": 386.99, "r_x3": 523.23, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 411.57, "t": 399.42, "r": 415.96, "b": 408.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57, "r_y0": 408.21, "r_x1": 415.96, "r_y1": 408.21, "r_x2": 415.96, "r_y2": 399.42, "r_x3": 411.57, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 415.96, "t": 399.42, "r": 420.36, "b": 408.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96, "r_y0": 408.21, "r_x1": 420.36, "r_y1": 408.21, "r_x2": 420.36, "r_y2": 399.42, "r_x3": 415.96, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 442.31, "t": 399.04, "r": 451.09, "b": 407.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 407.82, "r_x1": 451.09, "r_y1": 407.82, "r_x2": 451.09, "r_y2": 399.04, "r_x3": 442.31, "r_y3": 399.04, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 478.78, "t": 399.0, "r": 487.56, "b": 407.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.78, "r_y0": 407.78, "r_x1": 487.56, "r_y1": 407.78, "r_x2": 487.56, "r_y2": 399.0, "r_x3": 478.78, "r_y3": 399.0, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 523.97, "t": 398.61, "r": 532.76, "b": 407.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97, "r_y0": 407.4, "r_x1": 532.76, "r_y1": 407.4, "r_x2": 532.76, "r_y2": 398.61, "r_x3": 523.97, "r_y3": 398.61, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 385.09, "t": 357.76, "r": 391.1, "b": 367.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09, "r_y0": 367.89, "r_x1": 391.1, "r_y1": 367.89, "r_x2": 391.1, "r_y2": 357.76, "r_x3": 385.09, "r_y3": 357.76, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 333.43, "t": 380.73, "r": 339.44, "b": 390.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 390.86, "r_x1": 339.44, "r_y1": 390.86, "r_x2": 339.44, "r_y2": 380.73, "r_x3": 333.43, "r_y3": 380.73, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 478.07, "t": 341.04, "r": 484.08, "b": 351.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07, "r_y0": 351.17, "r_x1": 484.08, "r_y1": 351.17, "r_x2": 484.08, "r_y2": 341.04, "r_x3": 478.07, "r_y3": 341.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 23, "page_no": 0, "cluster": { "id": 23, "label": "picture", "bbox": { "l": 315.72, "t": 433.82, "r": 536.84, "b": 496.03, "coord_origin": "TOPLEFT" }, "confidence": 0.509, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.1, "t": 437.69, "r": 398.5, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.25, "t": 449.55, "r": 351.64, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.7, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.9, "t": 473.32, "r": 337.91, "b": 483.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.88, "t": 437.59, "r": 465.88, "b": 447.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 11, "page_no": 0, "cluster": { "id": 11, "label": "table", "bbox": { "l": 315.72, "t": 433.82, "r": 536.84, "b": 496.03, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.1, "t": 437.69, "r": 398.5, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.25, "t": 449.55, "r": 351.64, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.7, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.9, "t": 473.32, "r": 337.91, "b": 483.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.88, "t": 437.59, "r": 465.88, "b": 447.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 5, "table_cells": [ { "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "picture", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "picture", "bbox": { "l": 315.65, "t": 228.72, "r": 537.15, "b": 302.8, "coord_origin": "TOPLEFT" }, "confidence": 0.609, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.2, "t": 269.35, "r": 337.2, "b": 279.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.03, "t": 252.68, "r": 390.04, "b": 262.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 15, "page_no": 0, "cluster": { "id": 15, "label": "table", "bbox": { "l": 315.65, "t": 228.72, "r": 537.15, "b": 302.8, "coord_origin": "TOPLEFT" }, "confidence": 0.652, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.2, "t": 269.35, "r": 337.2, "b": 279.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.03, "t": 252.68, "r": 390.04, "b": 262.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 1, "num_cols": 1, "table_cells": [ { "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 308.86, "t": 514.5, "r": 545.12, "b": 559.27, "coord_origin": "TOPLEFT" }, "confidence": 0.921, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 523.41, "r_x1": 345.73, "r_y1": 523.41, "r_x2": 345.73, "r_y2": 514.5, "r_x3": 308.86, "r_y3": 514.5, "coord_origin": "TOPLEFT" }, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18, "r_y0": 523.41, "r_x1": 545.12, "r_y1": 523.41, "r_x2": 545.12, "r_y2": 514.5, "r_x3": 353.18, "r_y3": 514.5, "coord_origin": "TOPLEFT" }, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 535.36, "r_x1": 545.12, "r_y1": 535.36, "r_x2": 545.12, "r_y2": 526.46, "r_x3": 308.86, "r_y3": 526.46, "coord_origin": "TOPLEFT" }, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 547.32, "r_x1": 545.12, "r_y1": 547.32, "r_x2": 545.12, "r_y2": 538.41, "r_x3": 308.86, "r_y3": 538.41, "coord_origin": "TOPLEFT" }, "text": "text and (3) cells with no content. Image from PubTabNet", "orig": "text and (3) cells with no content. Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 559.27, "r_x1": 505.69, "r_y1": 559.27, "r_x2": 505.69, "r_y2": 550.37, "r_x3": 308.86, "r_y3": 550.37, "coord_origin": "TOPLEFT" }, "text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'." }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 584.41, "r": 545.12, "b": 665.05, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 593.32, "r_x1": 545.11, "r_y1": 593.32, "r_x2": 545.11, "r_y2": 584.41, "r_x3": 320.82, "r_y3": 584.41, "coord_origin": "TOPLEFT" }, "text": "Recently, significant progress has been made with vi-", "orig": "Recently, significant progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.27, "r_x1": 545.12, "r_y1": 605.27, "r_x2": 545.12, "r_y2": 596.36, "r_x3": 308.86, "r_y3": 596.36, "coord_origin": "TOPLEFT" }, "text": "sion based approaches to extract tables in documents. For", "orig": "sion based approaches to extract tables in documents. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.23, "r_x1": 545.12, "r_y1": 617.23, "r_x2": 545.12, "r_y2": 608.32, "r_x3": 308.86, "r_y3": 608.32, "coord_origin": "TOPLEFT" }, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.18, "r_x1": 545.12, "r_y1": 629.18, "r_x2": 545.12, "r_y2": 620.27, "r_x3": 308.86, "r_y3": 620.27, "coord_origin": "TOPLEFT" }, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.14, "r_x1": 353.69, "r_y1": 641.14, "r_x2": 353.69, "r_y2": 632.23, "r_x3": 308.86, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "lenges, i.e.", "orig": "lenges, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.11, "r_y0": 641.14, "r_x1": 374.67, "r_y1": 641.14, "r_x2": 374.67, "r_y2": 632.23, "r_x3": 362.11, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.36, "r_y0": 641.14, "r_x1": 545.12, "r_y1": 641.14, "r_x2": 545.12, "r_y2": 632.23, "r_x3": 377.36, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "finding the location of the table(s) on a", "orig": "finding the location of the table(s) on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.09, "r_x1": 545.12, "r_y1": 653.09, "r_x2": 545.12, "r_y2": 644.19, "r_x3": 308.86, "r_y3": 644.19, "coord_origin": "TOPLEFT" }, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.05, "r_x1": 375.55, "r_y1": 665.05, "r_x2": 375.55, "r_y2": 656.14, "r_x3": 308.86, "r_y3": 656.14, "coord_origin": "TOPLEFT" }, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document." }, { "label": "text", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 668.38, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 320.82, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "of-the-art object-detection networks (e.g. YOLO and later", "orig": "of-the-art object-detection networks (e.g. YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.11, "r_y1": 713.15, "r_x2": 545.11, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "on Mask-RCNN [9]). For all practical purposes, it can be", "orig": "on Mask-RCNN [9]). For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be" }, { "label": "page_footer", "id": 12, "page_no": 0, "cluster": { "id": 12, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.805, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1" }, { "label": "page_header", "id": 9, "page_no": 0, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 18.34, "t": 207.82, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 560.0, "r_x2": 36.34, "r_y2": 207.82, "r_x3": 18.34, "r_y3": 207.82, "coord_origin": "TOPLEFT" }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022" } ], "body": [ { "label": "section_header", "id": 8, "page_no": 0, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 96.3, "t": 107.03, "r": 498.93, "b": 119.93, "coord_origin": "TOPLEFT" }, "confidence": 0.887, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.3, "r_y0": 119.93, "r_x1": 498.93, "r_y1": 119.93, "r_x2": 498.93, "r_y2": 107.03, "r_x3": 96.3, "r_y3": 107.03, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer: Table Structure Understanding with Transformers." }, { "label": "section_header", "id": 13, "page_no": 0, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 142.48, "t": 146.69, "r": 452.75, "b": 171.32, "coord_origin": "TOPLEFT" }, "confidence": 0.759, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.48, "r_y0": 157.37, "r_x1": 452.75, "r_y1": 157.37, "r_x2": 452.75, "r_y2": 146.69, "r_x3": 142.48, "r_y3": 146.69, "coord_origin": "TOPLEFT" }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.92, "r_y0": 171.32, "r_x1": 332.31, "r_y1": 171.32, "r_x2": 332.31, "r_y2": 160.63, "r_x3": 262.92, "r_y3": 160.63, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research" }, { "label": "key_value_region", "id": 25, "page_no": 0, "cluster": { "id": 25, "label": "key_value_region", "bbox": { "l": 208.12, "t": 175.96, "r": 378.73, "b": 184.43, "coord_origin": "TOPLEFT" }, "confidence": 0.485, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.12, "r_y0": 184.43, "r_x1": 212.73, "r_y1": 184.43, "r_x2": 212.73, "r_y2": 175.96, "r_x3": 208.12, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.0, "r_x1": 293.43, "r_y1": 184.0, "r_x2": 293.43, "r_y2": 177.08, "r_x3": 212.73, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.43, "r_y0": 184.43, "r_x1": 298.04, "r_y1": 184.43, "r_x2": 298.04, "r_y2": 175.96, "r_x3": 293.43, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03, "r_y0": 184.0, "r_x1": 378.73, "r_y1": 184.0, "r_x2": 378.73, "r_y2": 177.08, "r_x3": 298.03, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 208.12, "t": 175.96, "r": 378.73, "b": 184.43, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.12, "r_y0": 184.43, "r_x1": 212.73, "r_y1": 184.43, "r_x2": 212.73, "r_y2": 175.96, "r_x3": 208.12, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.73, "r_y0": 184.0, "r_x1": 293.43, "r_y1": 184.0, "r_x2": 293.43, "r_y2": 177.08, "r_x3": 212.73, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "ahn,nli,mly,taa", "orig": "ahn,nli,mly,taa", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.43, "r_y0": 184.43, "r_x1": 298.04, "r_y1": 184.43, "r_x2": 298.04, "r_y2": 175.96, "r_x3": 293.43, "r_y3": 175.96, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.03, "r_y0": 184.0, "r_x1": 378.73, "r_y1": 184.0, "r_x2": 378.73, "r_y2": 177.08, "r_x3": 298.03, "r_y3": 177.08, "coord_origin": "TOPLEFT" }, "text": "@zurich.ibm.com", "orig": "@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 145.99, "t": 215.48, "r": 190.48, "b": 226.23, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99, "r_y0": 226.23, "r_x1": 190.48, "r_y1": 226.23, "r_x2": 190.48, "r_y2": 215.48, "r_x3": 145.99, "r_y3": 215.48, "coord_origin": "TOPLEFT" }, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract" }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 241.4, "r": 286.37, "b": 513.0, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 249.98, "r_x1": 286.36, "r_y1": 249.98, "r_x2": 286.36, "r_y2": 241.4, "r_x3": 62.07, "r_y3": 241.4, "coord_origin": "TOPLEFT" }, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 261.94, "r_x1": 286.37, "r_y1": 261.94, "r_x2": 286.37, "r_y2": 253.35, "r_x3": 50.11, "r_y3": 253.35, "coord_origin": "TOPLEFT" }, "text": "pact representation. This content is extremely valuable for", "orig": "pact representation. This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 273.89, "r_x1": 286.37, "r_y1": 273.89, "r_x2": 286.37, "r_y2": 265.31, "r_x3": 50.11, "r_y3": 265.31, "coord_origin": "TOPLEFT" }, "text": "systems such as search engines, Knowledge Graph\u2019s, etc,", "orig": "systems such as search engines, Knowledge Graph\u2019s, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 285.85, "r_x1": 286.37, "r_y1": 285.85, "r_x2": 286.37, "r_y2": 277.26, "r_x3": 50.11, "r_y3": 277.26, "coord_origin": "TOPLEFT" }, "text": "since they enhance their predictive capabilities. Unfortu-", "orig": "since they enhance their predictive capabilities. Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 297.8, "r_x1": 286.37, "r_y1": 297.8, "r_x2": 286.37, "r_y2": 289.22, "r_x3": 50.11, "r_y3": 289.22, "coord_origin": "TOPLEFT" }, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 309.76, "r_x1": 286.37, "r_y1": 309.76, "r_x2": 286.37, "r_y2": 301.17, "r_x3": 50.11, "r_y3": 301.17, "coord_origin": "TOPLEFT" }, "text": "Furthermore, they can have complex column/row-header", "orig": "Furthermore, they can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 321.71, "r_x1": 286.37, "r_y1": 321.71, "r_x2": 286.37, "r_y2": 313.13, "r_x3": 50.11, "r_y3": 313.13, "coord_origin": "TOPLEFT" }, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 333.67, "r_x1": 286.37, "r_y1": 333.67, "r_x2": 286.37, "r_y2": 325.08, "r_x3": 50.11, "r_y3": 325.08, "coord_origin": "TOPLEFT" }, "text": "tion lines, missing entries, etc. As such, the correct iden-", "orig": "tion lines, missing entries, etc. As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 345.62, "r_x1": 286.37, "r_y1": 345.62, "r_x2": 286.37, "r_y2": 337.04, "r_x3": 50.11, "r_y3": 337.04, "coord_origin": "TOPLEFT" }, "text": "tification of the table-structure from an image is a non-", "orig": "tification of the table-structure from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 357.58, "r_x1": 286.37, "r_y1": 357.58, "r_x2": 286.37, "r_y2": 348.99, "r_x3": 50.11, "r_y3": 348.99, "coord_origin": "TOPLEFT" }, "text": "trivial task. In this paper, we present a new table-structure", "orig": "trivial task. In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 369.53, "r_x1": 286.37, "r_y1": 369.53, "r_x2": 286.37, "r_y2": 360.95, "r_x3": 50.11, "r_y3": 360.95, "coord_origin": "TOPLEFT" }, "text": "identification model. The latter improves the latest end-to-", "orig": "identification model. The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 381.49, "r_x1": 286.37, "r_y1": 381.49, "r_x2": 286.37, "r_y2": 372.9, "r_x3": 50.11, "r_y3": 372.9, "coord_origin": "TOPLEFT" }, "text": "end deep learning model (i.e. encoder-dual-decoder from", "orig": "end deep learning model (i.e. encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 393.44, "r_x1": 286.37, "r_y1": 393.44, "r_x2": 286.37, "r_y2": 384.86, "r_x3": 50.11, "r_y3": 384.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet) in two significant ways. First, we introduce a", "orig": "PubTabNet) in two significant ways. First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 405.4, "r_x1": 286.37, "r_y1": 405.4, "r_x2": 286.37, "r_y2": 396.81, "r_x3": 50.11, "r_y3": 396.81, "coord_origin": "TOPLEFT" }, "text": "new object detection decoder for table-cells. In this way,", "orig": "new object detection decoder for table-cells. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 417.35, "r_x1": 286.37, "r_y1": 417.35, "r_x2": 286.37, "r_y2": 408.77, "r_x3": 50.11, "r_y3": 408.77, "coord_origin": "TOPLEFT" }, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 429.31, "r_x1": 286.37, "r_y1": 429.31, "r_x2": 286.37, "r_y2": 420.72, "r_x3": 50.11, "r_y3": 420.72, "coord_origin": "TOPLEFT" }, "text": "matic PDF\u2019s directly from the PDF source and avoid the", "orig": "matic PDF\u2019s directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 441.27, "r_x1": 207.23, "r_y1": 441.27, "r_x2": 207.23, "r_y2": 432.68, "r_x3": 50.11, "r_y3": 432.68, "coord_origin": "TOPLEFT" }, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.1, "r_y0": 441.27, "r_x1": 286.37, "r_y1": 441.27, "r_x2": 286.37, "r_y2": 432.68, "r_x3": 214.1, "r_y3": 432.68, "coord_origin": "TOPLEFT" }, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 453.22, "r_x1": 286.37, "r_y1": 453.22, "r_x2": 286.37, "r_y2": 444.63, "r_x3": 50.11, "r_y3": 444.63, "coord_origin": "TOPLEFT" }, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 465.18, "r_x1": 286.37, "r_y1": 465.18, "r_x2": 286.37, "r_y2": 456.59, "r_x3": 50.11, "r_y3": 456.59, "coord_origin": "TOPLEFT" }, "text": "allows us to tackle non-english tables. Second, we replace", "orig": "allows us to tackle non-english tables. Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 477.13, "r_x1": 286.37, "r_y1": 477.13, "r_x2": 286.37, "r_y2": 468.54, "r_x3": 50.11, "r_y3": 468.54, "coord_origin": "TOPLEFT" }, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 489.09, "r_x1": 286.37, "r_y1": 489.09, "r_x2": 286.37, "r_y2": 480.5, "r_x3": 50.11, "r_y3": 480.5, "coord_origin": "TOPLEFT" }, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 501.04, "r_x1": 286.37, "r_y1": 501.04, "r_x2": 286.37, "r_y2": 492.45, "r_x3": 50.11, "r_y3": 492.45, "coord_origin": "TOPLEFT" }, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 513.0, "r_x1": 276.65, "r_y1": 513.0, "r_x2": 276.65, "r_y2": 504.41, "r_x3": 50.11, "r_y3": 504.41, "coord_origin": "TOPLEFT" }, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables." }, { "label": "section_header", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 50.11, "t": 539.94, "r": 126.95, "b": 550.69, "coord_origin": "TOPLEFT" }, "confidence": 0.932, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 550.69, "r_x1": 58.12, "r_y1": 550.69, "r_x2": 58.12, "r_y2": 539.94, "r_x3": 50.11, "r_y3": 539.94, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.8, "r_y0": 550.69, "r_x1": 126.95, "r_y1": 550.69, "r_x2": 126.95, "r_y2": 539.94, "r_x3": 68.8, "r_y3": 539.94, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Introduction" }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 560.78, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 569.69, "r_x1": 286.36, "r_y1": 569.69, "r_x2": 286.36, "r_y2": 560.78, "r_x3": 62.07, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "The occurrence of tables in documents is ubiquitous.", "orig": "The occurrence of tables in documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 581.64, "r_x1": 286.37, "r_y1": 581.64, "r_x2": 286.37, "r_y2": 572.74, "r_x3": 50.11, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 593.6, "r_x1": 286.37, "r_y1": 593.6, "r_x2": 286.37, "r_y2": 584.69, "r_x3": 50.11, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 605.56, "r_x1": 286.37, "r_y1": 605.56, "r_x2": 286.37, "r_y2": 596.65, "r_x3": 50.11, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "tremely valuable. Unfortunately, this compact representa-", "orig": "tremely valuable. Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 617.51, "r_x1": 286.37, "r_y1": 617.51, "r_x2": 286.37, "r_y2": 608.6, "r_x3": 50.11, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 629.47, "r_x1": 286.37, "r_y1": 629.47, "r_x2": 286.37, "r_y2": 620.56, "r_x3": 50.11, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 641.42, "r_x1": 286.37, "r_y1": 641.42, "r_x2": 286.37, "r_y2": 632.51, "r_x3": 50.11, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 50.11, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "table-entries. Fig. 1 shows a table which presents all these", "orig": "table-entries. Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 76.4, "r_y1": 713.15, "r_x2": 76.4, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues." }, { "label": "section_header", "id": 14, "page_no": 0, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 315.57, "t": 218.01, "r": 408.44, "b": 226.75, "coord_origin": "TOPLEFT" }, "confidence": 0.672, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 226.75, "r_x1": 324.01, "r_y1": 226.75, "r_x2": 324.01, "r_y2": 218.01, "r_x3": 315.57, "r_y3": 218.01, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.23, "r_y0": 226.75, "r_x1": 408.44, "r_y1": 226.75, "r_x2": 408.44, "r_y2": 218.01, "r_x3": 328.23, "r_y3": 218.01, "coord_origin": "TOPLEFT" }, "text": "Picture of a table:", "orig": "Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "a. Picture of a table:" }, { "label": "list_item", "id": 17, "page_no": 0, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 315.57, "t": 313.69, "r": 486.4, "b": 333.24, "coord_origin": "TOPLEFT" }, "confidence": 0.555, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 322.44, "r_x1": 325.06, "r_y1": 322.44, "r_x2": 325.06, "r_y2": 313.69, "r_x3": 315.57, "r_y3": 313.69, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.8, "r_y0": 322.44, "r_x1": 486.4, "r_y1": 322.44, "r_x2": 486.4, "r_y2": 313.69, "r_x3": 329.8, "r_y3": 313.69, "coord_origin": "TOPLEFT" }, "text": "Red-annotation of bounding boxes,", "orig": "Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.46, "r_y0": 333.24, "r_x1": 472.47, "r_y1": 333.24, "r_x2": 472.47, "r_y2": 324.49, "r_x3": 326.46, "r_y3": 324.49, "coord_origin": "TOPLEFT" }, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer" }, { "label": "list_item", "id": 18, "page_no": 0, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 315.57, "t": 420.18, "r": 491.19, "b": 428.93, "coord_origin": "TOPLEFT" }, "confidence": 0.55, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.57, "r_y0": 428.93, "r_x1": 324.81, "r_y1": 428.93, "r_x2": 324.81, "r_y2": 420.18, "r_x3": 315.57, "r_y3": 420.18, "coord_origin": "TOPLEFT" }, "text": "c.", "orig": "c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.43, "r_y0": 428.93, "r_x1": 491.19, "r_y1": 428.93, "r_x2": 491.19, "r_y2": 420.18, "r_x3": 329.43, "r_y3": 420.18, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer:", "orig": "Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "c. Structure predicted by TableFormer:" }, { "label": "picture", "id": 10, "page_no": 0, "cluster": { "id": 10, "label": "picture", "bbox": { "l": 314.78, "t": 338.07, "r": 539.18, "b": 410.05, "coord_origin": "TOPLEFT" }, "confidence": 0.874, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.15, "r_y0": 351.61, "r_x1": 412.54, "r_y1": 351.61, "r_x2": 412.54, "r_y2": 342.83, "r_x3": 408.15, "r_y3": 342.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11, "r_y0": 350.36, "r_x1": 360.5, "r_y1": 350.36, "r_x2": 360.5, "r_y2": 341.57, "r_x3": 356.11, "r_y3": 341.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.68, "r_y0": 349.72, "r_x1": 505.07, "r_y1": 349.72, "r_x2": 505.07, "r_y2": 340.94, "r_x3": 500.68, "r_y3": 340.94, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13, "r_y0": 360.53, "r_x1": 360.53, "r_y1": 360.53, "r_x2": 360.53, "r_y2": 351.75, "r_x3": 356.13, "r_y3": 351.75, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.54, "r_y0": 364.66, "r_x1": 406.93, "r_y1": 364.66, "r_x2": 406.93, "r_y2": 355.88, "r_x3": 402.54, "r_y3": 355.88, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58, "r_y0": 361.63, "r_x1": 452.97, "r_y1": 361.63, "r_x2": 452.97, "r_y2": 352.84, "r_x3": 448.58, "r_y3": 352.84, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65, "r_y0": 362.49, "r_x1": 496.04, "r_y1": 362.49, "r_x2": 496.04, "r_y2": 353.71, "r_x3": 491.65, "r_y3": 353.71, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.14, "r_y0": 362.12, "r_x1": 539.53, "r_y1": 362.12, "r_x2": 539.53, "r_y2": 353.34, "r_x3": 535.14, "r_y3": 353.34, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.83, "r_y0": 395.88, "r_x1": 353.22, "r_y1": 395.88, "r_x2": 353.22, "r_y2": 387.1, "r_x3": 348.83, "r_y3": 387.1, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27, "r_y0": 384.16, "r_x1": 393.66, "r_y1": 384.16, "r_x2": 393.66, "r_y2": 375.37, "r_x3": 389.27, "r_y3": 375.37, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67, "r_y0": 384.43, "r_x1": 451.46, "r_y1": 384.43, "r_x2": 451.46, "r_y2": 375.65, "r_x3": 442.67, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.44, "r_y0": 384.32, "r_x1": 485.9, "r_y1": 384.32, "r_x2": 485.9, "r_y2": 375.53, "r_x3": 477.44, "r_y3": 375.53, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57, "r_y0": 384.43, "r_x1": 531.36, "r_y1": 384.43, "r_x2": 531.36, "r_y2": 375.65, "r_x3": 522.57, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.23, "r_y0": 395.9, "r_x1": 409.01, "r_y1": 395.9, "r_x2": 409.01, "r_y2": 387.11, "r_x3": 400.23, "r_y3": 387.11, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 395.77, "r_x1": 451.09, "r_y1": 395.77, "r_x2": 451.09, "r_y2": 386.99, "r_x3": 442.31, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.22, "r_y0": 396.16, "r_x1": 487.0, "r_y1": 396.16, "r_x2": 487.0, "r_y2": 387.37, "r_x3": 478.22, "r_y3": 387.37, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.23, "r_y0": 395.77, "r_x1": 532.01, "r_y1": 395.77, "r_x2": 532.01, "r_y2": 386.99, "r_x3": 523.23, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57, "r_y0": 408.21, "r_x1": 415.96, "r_y1": 408.21, "r_x2": 415.96, "r_y2": 399.42, "r_x3": 411.57, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96, "r_y0": 408.21, "r_x1": 420.36, "r_y1": 408.21, "r_x2": 420.36, "r_y2": 399.42, "r_x3": 415.96, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 407.82, "r_x1": 451.09, "r_y1": 407.82, "r_x2": 451.09, "r_y2": 399.04, "r_x3": 442.31, "r_y3": 399.04, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.78, "r_y0": 407.78, "r_x1": 487.56, "r_y1": 407.78, "r_x2": 487.56, "r_y2": 399.0, "r_x3": 478.78, "r_y3": 399.0, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97, "r_y0": 407.4, "r_x1": 532.76, "r_y1": 407.4, "r_x2": 532.76, "r_y2": 398.61, "r_x3": 523.97, "r_y3": 398.61, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09, "r_y0": 367.89, "r_x1": 391.1, "r_y1": 367.89, "r_x2": 391.1, "r_y2": 357.76, "r_x3": 385.09, "r_y3": 357.76, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 390.86, "r_x1": 339.44, "r_y1": 390.86, "r_x2": 339.44, "r_y2": 380.73, "r_x3": 333.43, "r_y3": 380.73, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07, "r_y0": 351.17, "r_x1": 484.08, "r_y1": 351.17, "r_x2": 484.08, "r_y2": 341.04, "r_x3": 478.07, "r_y3": 341.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 40, "label": "text", "bbox": { "l": 408.15, "t": 342.83, "r": 412.54, "b": 351.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.15, "r_y0": 351.61, "r_x1": 412.54, "r_y1": 351.61, "r_x2": 412.54, "r_y2": 342.83, "r_x3": 408.15, "r_y3": 342.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 356.11, "t": 341.57, "r": 360.5, "b": 350.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.11, "r_y0": 350.36, "r_x1": 360.5, "r_y1": 350.36, "r_x2": 360.5, "r_y2": 341.57, "r_x3": 356.11, "r_y3": 341.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 500.68, "t": 340.94, "r": 505.07, "b": 349.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.68, "r_y0": 349.72, "r_x1": 505.07, "r_y1": 349.72, "r_x2": 505.07, "r_y2": 340.94, "r_x3": 500.68, "r_y3": 340.94, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 356.13, "t": 351.75, "r": 360.53, "b": 360.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.13, "r_y0": 360.53, "r_x1": 360.53, "r_y1": 360.53, "r_x2": 360.53, "r_y2": 351.75, "r_x3": 356.13, "r_y3": 351.75, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 402.54, "t": 355.88, "r": 406.93, "b": 364.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 402.54, "r_y0": 364.66, "r_x1": 406.93, "r_y1": 364.66, "r_x2": 406.93, "r_y2": 355.88, "r_x3": 402.54, "r_y3": 355.88, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 448.58, "t": 352.84, "r": 452.97, "b": 361.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.58, "r_y0": 361.63, "r_x1": 452.97, "r_y1": 361.63, "r_x2": 452.97, "r_y2": 352.84, "r_x3": 448.58, "r_y3": 352.84, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 491.65, "t": 353.71, "r": 496.04, "b": 362.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 491.65, "r_y0": 362.49, "r_x1": 496.04, "r_y1": 362.49, "r_x2": 496.04, "r_y2": 353.71, "r_x3": 491.65, "r_y3": 353.71, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 535.14, "t": 353.34, "r": 539.53, "b": 362.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 535.14, "r_y0": 362.12, "r_x1": 539.53, "r_y1": 362.12, "r_x2": 539.53, "r_y2": 353.34, "r_x3": 535.14, "r_y3": 353.34, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 348.83, "t": 387.1, "r": 353.22, "b": 395.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.83, "r_y0": 395.88, "r_x1": 353.22, "r_y1": 395.88, "r_x2": 353.22, "r_y2": 387.1, "r_x3": 348.83, "r_y3": 387.1, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 389.27, "t": 375.37, "r": 393.66, "b": 384.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.27, "r_y0": 384.16, "r_x1": 393.66, "r_y1": 384.16, "r_x2": 393.66, "r_y2": 375.37, "r_x3": 389.27, "r_y3": 375.37, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 442.67, "t": 375.65, "r": 451.46, "b": 384.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.67, "r_y0": 384.43, "r_x1": 451.46, "r_y1": 384.43, "r_x2": 451.46, "r_y2": 375.65, "r_x3": 442.67, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 477.44, "t": 375.53, "r": 485.9, "b": 384.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.44, "r_y0": 384.32, "r_x1": 485.9, "r_y1": 384.32, "r_x2": 485.9, "r_y2": 375.53, "r_x3": 477.44, "r_y3": 375.53, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 522.57, "t": 375.65, "r": 531.36, "b": 384.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 522.57, "r_y0": 384.43, "r_x1": 531.36, "r_y1": 384.43, "r_x2": 531.36, "r_y2": 375.65, "r_x3": 522.57, "r_y3": 375.65, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 400.23, "t": 387.11, "r": 409.01, "b": 395.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.23, "r_y0": 395.9, "r_x1": 409.01, "r_y1": 395.9, "r_x2": 409.01, "r_y2": 387.11, "r_x3": 400.23, "r_y3": 387.11, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 442.31, "t": 386.99, "r": 451.09, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 395.77, "r_x1": 451.09, "r_y1": 395.77, "r_x2": 451.09, "r_y2": 386.99, "r_x3": 442.31, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 478.22, "t": 387.37, "r": 487.0, "b": 396.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.22, "r_y0": 396.16, "r_x1": 487.0, "r_y1": 396.16, "r_x2": 487.0, "r_y2": 387.37, "r_x3": 478.22, "r_y3": 387.37, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 523.23, "t": 386.99, "r": 532.01, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.23, "r_y0": 395.77, "r_x1": 532.01, "r_y1": 395.77, "r_x2": 532.01, "r_y2": 386.99, "r_x3": 523.23, "r_y3": 386.99, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 411.57, "t": 399.42, "r": 415.96, "b": 408.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.57, "r_y0": 408.21, "r_x1": 415.96, "r_y1": 408.21, "r_x2": 415.96, "r_y2": 399.42, "r_x3": 411.57, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 415.96, "t": 399.42, "r": 420.36, "b": 408.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.96, "r_y0": 408.21, "r_x1": 420.36, "r_y1": 408.21, "r_x2": 420.36, "r_y2": 399.42, "r_x3": 415.96, "r_y3": 399.42, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 442.31, "t": 399.04, "r": 451.09, "b": 407.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.31, "r_y0": 407.82, "r_x1": 451.09, "r_y1": 407.82, "r_x2": 451.09, "r_y2": 399.04, "r_x3": 442.31, "r_y3": 399.04, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 478.78, "t": 399.0, "r": 487.56, "b": 407.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.78, "r_y0": 407.78, "r_x1": 487.56, "r_y1": 407.78, "r_x2": 487.56, "r_y2": 399.0, "r_x3": 478.78, "r_y3": 399.0, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 523.97, "t": 398.61, "r": 532.76, "b": 407.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 523.97, "r_y0": 407.4, "r_x1": 532.76, "r_y1": 407.4, "r_x2": 532.76, "r_y2": 398.61, "r_x3": 523.97, "r_y3": 398.61, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 385.09, "t": 357.76, "r": 391.1, "b": 367.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.09, "r_y0": 367.89, "r_x1": 391.1, "r_y1": 367.89, "r_x2": 391.1, "r_y2": 357.76, "r_x3": 385.09, "r_y3": 357.76, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 333.43, "t": 380.73, "r": 339.44, "b": 390.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 390.86, "r_x1": 339.44, "r_y1": 390.86, "r_x2": 339.44, "r_y2": 380.73, "r_x3": 333.43, "r_y3": 380.73, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 478.07, "t": 341.04, "r": 484.08, "b": 351.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.07, "r_y0": 351.17, "r_x1": 484.08, "r_y1": 351.17, "r_x2": 484.08, "r_y2": 341.04, "r_x3": 478.07, "r_y3": 341.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 23, "page_no": 0, "cluster": { "id": 23, "label": "picture", "bbox": { "l": 315.72, "t": 433.82, "r": 536.84, "b": 496.03, "coord_origin": "TOPLEFT" }, "confidence": 0.509, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.1, "t": 437.69, "r": 398.5, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.25, "t": 449.55, "r": 351.64, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.7, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.9, "t": 473.32, "r": 337.91, "b": 483.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.88, "t": 437.59, "r": 465.88, "b": 447.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 11, "page_no": 0, "cluster": { "id": 11, "label": "table", "bbox": { "l": 315.72, "t": 433.82, "r": 536.84, "b": 496.03, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 62, "label": "text", "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 446.47, "r_x1": 351.64, "r_y1": 446.47, "r_x2": 351.64, "r_y2": 437.69, "r_x3": 347.25, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.88, "r_y0": 446.47, "r_x1": 323.27, "r_y1": 446.47, "r_x2": 323.27, "r_y2": 437.69, "r_x3": 318.88, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 394.1, "t": 437.69, "r": 398.5, "b": 446.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 446.47, "r_x1": 398.5, "r_y1": 446.47, "r_x2": 398.5, "r_y2": 437.69, "r_x3": 394.1, "r_y3": 437.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 458.33, "r_x1": 323.17, "r_y1": 458.33, "r_x2": 323.17, "r_y2": 449.55, "r_x3": 318.77, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 347.25, "t": 449.55, "r": 351.64, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 458.33, "r_x1": 351.64, "r_y1": 458.33, "r_x2": 351.64, "r_y2": 449.55, "r_x3": 347.25, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 458.33, "r_x1": 398.5, "r_y1": 458.33, "r_x2": 398.5, "r_y2": 449.55, "r_x3": 394.1, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 458.33, "r_x1": 445.35, "r_y1": 458.33, "r_x2": 445.35, "r_y2": 449.55, "r_x3": 440.96, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 458.33, "r_x1": 492.21, "r_y1": 458.33, "r_x2": 492.21, "r_y2": 449.55, "r_x3": 487.81, "r_y3": 449.55, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 482.49, "r_x1": 323.17, "r_y1": 482.49, "r_x2": 323.17, "r_y2": 473.7, "r_x3": 318.77, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 470.63, "r_x1": 351.64, "r_y1": 470.63, "r_x2": 351.64, "r_y2": 461.84, "r_x3": 347.25, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 470.63, "r_x1": 402.89, "r_y1": 470.63, "r_x2": 402.89, "r_y2": 461.84, "r_x3": 394.1, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 470.63, "r_x1": 449.42, "r_y1": 470.63, "r_x2": 449.42, "r_y2": 461.84, "r_x3": 440.96, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 470.63, "r_x1": 496.6, "r_y1": 470.63, "r_x2": 496.6, "r_y2": 461.84, "r_x3": 487.81, "r_y3": 461.84, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 482.49, "r_x1": 356.03, "r_y1": 482.49, "r_x2": 356.03, "r_y2": 473.7, "r_x3": 347.25, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 482.49, "r_x1": 402.89, "r_y1": 482.49, "r_x2": 402.89, "r_y2": 473.7, "r_x3": 394.1, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 482.49, "r_x1": 449.74, "r_y1": 482.49, "r_x2": 449.74, "r_y2": 473.7, "r_x3": 440.96, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 482.49, "r_x1": 496.6, "r_y1": 482.49, "r_x2": 496.6, "r_y2": 473.7, "r_x3": 487.81, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.25, "r_y0": 493.91, "r_x1": 356.03, "r_y1": 493.91, "r_x2": 356.03, "r_y2": 485.12, "r_x3": 347.25, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.1, "r_y0": 493.91, "r_x1": 402.89, "r_y1": 493.91, "r_x2": 402.89, "r_y2": 485.12, "r_x3": 394.1, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.96, "r_y0": 493.91, "r_x1": 449.74, "r_y1": 493.91, "r_x2": 449.74, "r_y2": 485.12, "r_x3": 440.96, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 487.81, "r_y0": 493.91, "r_x1": 496.6, "r_y1": 493.91, "r_x2": 496.6, "r_y2": 485.12, "r_x3": 487.81, "r_y3": 485.12, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 366.7, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 366.7, "r_y0": 459.25, "r_x1": 372.71, "r_y1": 459.25, "r_x2": 372.71, "r_y2": 449.12, "r_x3": 366.7, "r_y3": 449.12, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 331.9, "t": 473.32, "r": 337.91, "b": 483.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.9, "r_y0": 483.45, "r_x1": 337.91, "r_y1": 483.45, "r_x2": 337.91, "r_y2": 473.32, "r_x3": 331.9, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 459.88, "t": 437.59, "r": 465.88, "b": 447.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.88, "r_y0": 447.72, "r_x1": 465.88, "r_y1": 447.72, "r_x2": 465.88, "r_y2": 437.59, "r_x3": 459.88, "r_y3": 437.59, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 5, "table_cells": [ { "bbox": { "l": 347.25, "t": 437.69, "r": 351.64, "b": 446.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.88, "t": 437.69, "r": 323.27, "b": 446.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77, "t": 449.55, "r": 323.17, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 449.12, "r": 372.71, "b": 459.25, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 449.55, "r": 398.5, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 449.55, "r": 445.35, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 449.55, "r": 492.21, "b": 458.33, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 318.77, "t": 473.7, "r": 323.17, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 461.84, "r": 351.64, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 461.84, "r": 402.89, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 461.84, "r": 449.42, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 461.84, "r": 496.6, "b": 470.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 473.7, "r": 356.03, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 473.7, "r": 402.89, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 473.7, "r": 449.74, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 473.7, "r": 496.6, "b": 482.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 347.25, "t": 485.12, "r": 356.03, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.1, "t": 485.12, "r": 402.89, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 440.96, "t": 485.12, "r": 449.74, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 487.81, "t": 485.12, "r": 496.6, "b": 493.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "picture", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "picture", "bbox": { "l": 315.65, "t": 228.72, "r": 537.15, "b": 302.8, "coord_origin": "TOPLEFT" }, "confidence": 0.609, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.2, "t": 269.35, "r": 337.2, "b": 279.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.03, "t": 252.68, "r": 390.04, "b": 262.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 15, "page_no": 0, "cluster": { "id": 15, "label": "table", "bbox": { "l": 315.65, "t": 228.72, "r": 537.15, "b": 302.8, "coord_origin": "TOPLEFT" }, "confidence": 0.652, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.95, "r_y0": 245.48, "r_x1": 457.95, "r_y1": 245.48, "r_x2": 457.95, "r_y2": 235.35, "r_x3": 451.95, "r_y3": 235.35, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 331.2, "t": 269.35, "r": 337.2, "b": 279.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.2, "r_y0": 279.48, "r_x1": 337.2, "r_y1": 279.48, "r_x2": 337.2, "r_y2": 269.35, "r_x3": 331.2, "r_y3": 269.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 384.03, "t": 252.68, "r": 390.04, "b": 262.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.03, "r_y0": 262.81, "r_x1": 390.04, "r_y1": 262.81, "r_x2": 390.04, "r_y2": 252.68, "r_x3": 384.03, "r_y3": 252.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 1, "num_cols": 1, "table_cells": [ { "bbox": { "l": 451.95, "t": 235.35, "r": 457.95, "b": 245.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 308.86, "t": 514.5, "r": 545.12, "b": 559.27, "coord_origin": "TOPLEFT" }, "confidence": 0.921, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 523.41, "r_x1": 345.73, "r_y1": 523.41, "r_x2": 345.73, "r_y2": 514.5, "r_x3": 308.86, "r_y3": 514.5, "coord_origin": "TOPLEFT" }, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.18, "r_y0": 523.41, "r_x1": 545.12, "r_y1": 523.41, "r_x2": 545.12, "r_y2": 514.5, "r_x3": 353.18, "r_y3": 514.5, "coord_origin": "TOPLEFT" }, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 535.36, "r_x1": 545.12, "r_y1": 535.36, "r_x2": 545.12, "r_y2": 526.46, "r_x3": 308.86, "r_y3": 526.46, "coord_origin": "TOPLEFT" }, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 547.32, "r_x1": 545.12, "r_y1": 547.32, "r_x2": 545.12, "r_y2": 538.41, "r_x3": 308.86, "r_y3": 538.41, "coord_origin": "TOPLEFT" }, "text": "text and (3) cells with no content. Image from PubTabNet", "orig": "text and (3) cells with no content. Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 559.27, "r_x1": 505.69, "r_y1": 559.27, "r_x2": 505.69, "r_y2": 550.37, "r_x3": 308.86, "r_y3": 550.37, "coord_origin": "TOPLEFT" }, "text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'." }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 584.41, "r": 545.12, "b": 665.05, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 593.32, "r_x1": 545.11, "r_y1": 593.32, "r_x2": 545.11, "r_y2": 584.41, "r_x3": 320.82, "r_y3": 584.41, "coord_origin": "TOPLEFT" }, "text": "Recently, significant progress has been made with vi-", "orig": "Recently, significant progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.27, "r_x1": 545.12, "r_y1": 605.27, "r_x2": 545.12, "r_y2": 596.36, "r_x3": 308.86, "r_y3": 596.36, "coord_origin": "TOPLEFT" }, "text": "sion based approaches to extract tables in documents. For", "orig": "sion based approaches to extract tables in documents. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.23, "r_x1": 545.12, "r_y1": 617.23, "r_x2": 545.12, "r_y2": 608.32, "r_x3": 308.86, "r_y3": 608.32, "coord_origin": "TOPLEFT" }, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.18, "r_x1": 545.12, "r_y1": 629.18, "r_x2": 545.12, "r_y2": 620.27, "r_x3": 308.86, "r_y3": 620.27, "coord_origin": "TOPLEFT" }, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.14, "r_x1": 353.69, "r_y1": 641.14, "r_x2": 353.69, "r_y2": 632.23, "r_x3": 308.86, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "lenges, i.e.", "orig": "lenges, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.11, "r_y0": 641.14, "r_x1": 374.67, "r_y1": 641.14, "r_x2": 374.67, "r_y2": 632.23, "r_x3": 362.11, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.36, "r_y0": 641.14, "r_x1": 545.12, "r_y1": 641.14, "r_x2": 545.12, "r_y2": 632.23, "r_x3": 377.36, "r_y3": 632.23, "coord_origin": "TOPLEFT" }, "text": "finding the location of the table(s) on a", "orig": "finding the location of the table(s) on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.09, "r_x1": 545.12, "r_y1": 653.09, "r_x2": 545.12, "r_y2": 644.19, "r_x3": 308.86, "r_y3": 644.19, "coord_origin": "TOPLEFT" }, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.05, "r_x1": 375.55, "r_y1": 665.05, "r_x2": 375.55, "r_y2": 656.14, "r_x3": 308.86, "r_y3": 656.14, "coord_origin": "TOPLEFT" }, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document." }, { "label": "text", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 668.38, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 320.82, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "of-the-art object-detection networks (e.g. YOLO and later", "orig": "of-the-art object-detection networks (e.g. YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.11, "r_y1": 713.15, "r_x2": 545.11, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "on Mask-RCNN [9]). For all practical purposes, it can be", "orig": "on Mask-RCNN [9]). For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be" } ], "headers": [ { "label": "page_footer", "id": 12, "page_no": 0, "cluster": { "id": 12, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.805, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1" }, { "label": "page_header", "id": 9, "page_no": 0, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 18.34, "t": 207.82, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 560.0, "r_x2": 36.34, "r_y2": 207.82, "r_x3": 18.34, "r_y3": 207.82, "coord_origin": "TOPLEFT" }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022" } ] } }, { "page_no": 1, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 112.65, "r_y1": 96.07, "r_x2": 112.65, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 108.48, "r_x1": 286.36, "r_y1": 108.48, "r_x2": 286.36, "r_y2": 99.57, "r_x3": 62.07, "r_y3": 99.57, "coord_origin": "TOPLEFT" }, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 120.43, "r_x1": 74.75, "r_y1": 120.43, "r_x2": 74.75, "r_y2": 111.53, "r_x3": 50.11, "r_y3": 111.53, "coord_origin": "TOPLEFT" }, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.33, "r_y0": 120.43, "r_x1": 286.37, "r_y1": 120.43, "r_x2": 286.37, "r_y2": 111.53, "r_x3": 81.33, "r_y3": 111.53, "coord_origin": "TOPLEFT" }, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 132.39, "r_x1": 286.37, "r_y1": 132.39, "r_x2": 286.37, "r_y2": 123.48, "r_x3": 50.11, "r_y3": 123.48, "coord_origin": "TOPLEFT" }, "text": "munity of document understanding [6, 4, 14]. Contrary to", "orig": "munity of document understanding [6, 4, 14]. Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 144.34, "r_x1": 286.37, "r_y1": 144.34, "r_x2": 286.37, "r_y2": 135.44, "r_x3": 50.11, "r_y3": 135.44, "coord_origin": "TOPLEFT" }, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 156.3, "r_x1": 286.37, "r_y1": 156.3, "r_x2": 286.37, "r_y2": 147.39, "r_x3": 50.11, "r_y3": 147.39, "coord_origin": "TOPLEFT" }, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 168.25, "r_x1": 286.37, "r_y1": 168.25, "r_x2": 286.37, "r_y2": 159.35, "r_x3": 50.11, "r_y3": 159.35, "coord_origin": "TOPLEFT" }, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 180.21, "r_x1": 286.37, "r_y1": 180.21, "r_x2": 286.37, "r_y2": 171.3, "r_x3": 50.11, "r_y3": 171.3, "coord_origin": "TOPLEFT" }, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 192.16, "r_x1": 286.37, "r_y1": 192.16, "r_x2": 286.37, "r_y2": 183.26, "r_x3": 50.11, "r_y3": 183.26, "coord_origin": "TOPLEFT" }, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 204.12, "r_x1": 286.37, "r_y1": 204.12, "r_x2": 286.37, "r_y2": 195.21, "r_x3": 50.11, "r_y3": 195.21, "coord_origin": "TOPLEFT" }, "text": "nesses (see Sec. 2). The common denominator here is the", "orig": "nesses (see Sec. 2). The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 216.07, "r_x1": 286.37, "r_y1": 216.07, "r_x2": 286.37, "r_y2": 207.17, "r_x3": 50.11, "r_y3": 207.17, "coord_origin": "TOPLEFT" }, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 228.03, "r_x1": 278.66, "r_y1": 228.03, "r_x2": 278.66, "r_y2": 219.12, "r_x3": 50.11, "r_y3": 219.12, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 240.44, "r_x1": 286.36, "r_y1": 240.44, "r_x2": 286.36, "r_y2": 231.53, "r_x3": 62.07, "r_y3": 231.53, "coord_origin": "TOPLEFT" }, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 252.39, "r_x1": 286.37, "r_y1": 252.39, "r_x2": 286.37, "r_y2": 243.49, "r_x3": 50.11, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "present a robust table-structure decomposition algorithm.", "orig": "present a robust table-structure decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.35, "r_x1": 286.37, "r_y1": 264.35, "r_x2": 286.37, "r_y2": 255.44, "r_x3": 50.11, "r_y3": 255.44, "coord_origin": "TOPLEFT" }, "text": "The design criteria for our model are the following. First,", "orig": "The design criteria for our model are the following. First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.3, "r_x1": 286.37, "r_y1": 276.3, "r_x2": 286.37, "r_y2": 267.4, "r_x3": 50.11, "r_y3": 267.4, "coord_origin": "TOPLEFT" }, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.26, "r_x1": 286.37, "r_y1": 288.26, "r_x2": 286.37, "r_y2": 279.35, "r_x3": 50.11, "r_y3": 279.35, "coord_origin": "TOPLEFT" }, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.21, "r_x1": 88.57, "r_y1": 300.21, "r_x2": 88.57, "r_y2": 291.31, "r_x3": 50.11, "r_y3": 291.31, "coord_origin": "TOPLEFT" }, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 95.5, "r_y0": 300.21, "r_x1": 286.37, "r_y1": 300.21, "r_x2": 286.37, "r_y2": 291.31, "r_x3": 95.5, "r_y3": 291.31, "coord_origin": "TOPLEFT" }, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.17, "r_x1": 286.37, "r_y1": 312.17, "r_x2": 286.37, "r_y2": 303.26, "r_x3": 50.11, "r_y3": 303.26, "coord_origin": "TOPLEFT" }, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.12, "r_x1": 286.37, "r_y1": 324.12, "r_x2": 286.37, "r_y2": 315.22, "r_x3": 50.11, "r_y3": 315.22, "coord_origin": "TOPLEFT" }, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.08, "r_x1": 286.37, "r_y1": 336.08, "r_x2": 286.37, "r_y2": 327.17, "r_x3": 50.11, "r_y3": 327.17, "coord_origin": "TOPLEFT" }, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.03, "r_x1": 286.37, "r_y1": 348.03, "r_x2": 286.37, "r_y2": 339.13, "r_x3": 50.11, "r_y3": 339.13, "coord_origin": "TOPLEFT" }, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.99, "r_x1": 286.37, "r_y1": 359.99, "r_x2": 286.37, "r_y2": 351.08, "r_x3": 50.11, "r_y3": 351.08, "coord_origin": "TOPLEFT" }, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.95, "r_x1": 76.95, "r_y1": 371.95, "r_x2": 76.95, "r_y2": 363.04, "r_x3": 50.11, "r_y3": 363.04, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 384.35, "r_x1": 286.36, "r_y1": 384.35, "r_x2": 286.36, "r_y2": 375.45, "r_x3": 62.07, "r_y3": 375.45, "coord_origin": "TOPLEFT" }, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.31, "r_x1": 120.99, "r_y1": 396.31, "r_x2": 120.99, "r_y2": 387.4, "r_x3": 50.11, "r_y3": 387.4, "coord_origin": "TOPLEFT" }, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 123.9, "r_y0": 396.24, "r_x1": 179.73, "r_y1": 396.24, "r_x2": 179.73, "r_y2": 387.28, "r_x3": 123.9, "r_y3": 387.28, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.65, "r_y0": 396.31, "r_x1": 286.37, "r_y1": 396.31, "r_x2": 286.37, "r_y2": 387.4, "r_x3": 182.65, "r_y3": 387.4, "coord_origin": "TOPLEFT" }, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 408.26, "r_x1": 181.76, "r_y1": 408.26, "r_x2": 181.76, "r_y2": 399.36, "r_x3": 50.11, "r_y3": 399.36, "coord_origin": "TOPLEFT" }, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.1, "r_y0": 408.19, "r_x1": 240.2, "r_y1": 408.19, "r_x2": 240.2, "r_y2": 399.24, "r_x3": 184.1, "r_y3": 399.24, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.2, "r_y0": 408.26, "r_x1": 286.36, "r_y1": 408.26, "r_x2": 286.36, "r_y2": 399.36, "r_x3": 240.2, "r_y3": 399.36, "coord_origin": "TOPLEFT" }, "text": "$^{1}$. In partic-", "orig": "$^{1}$. In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 420.22, "r_x1": 286.37, "r_y1": 420.22, "r_x2": 286.37, "r_y2": 411.31, "r_x3": 50.11, "r_y3": 411.31, "coord_origin": "TOPLEFT" }, "text": "ular, our contributions in this work can be summarised as", "orig": "ular, our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 432.17, "r_x1": 82.52, "r_y1": 432.17, "r_x2": 82.52, "r_y2": 423.27, "r_x3": 50.11, "r_y3": 423.27, "coord_origin": "TOPLEFT" }, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 453.46, "r_x1": 70.74, "r_y1": 453.46, "r_x2": 70.74, "r_y2": 444.55, "r_x3": 61.57, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.03, "r_y0": 453.46, "r_x1": 117.1, "r_y1": 453.46, "r_x2": 117.1, "r_y2": 444.55, "r_x3": 73.03, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.59, "r_y0": 453.39, "r_x1": 175.42, "r_y1": 453.39, "r_x2": 175.42, "r_y2": 444.43, "r_x3": 119.59, "r_y3": 444.43, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.42, "r_y0": 453.46, "r_x1": 286.36, "r_y1": 453.46, "r_x2": 286.36, "r_y2": 444.55, "r_x3": 175.42, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 465.41, "r_x1": 286.36, "r_y1": 465.41, "r_x2": 286.36, "r_y2": 456.51, "r_x3": 70.04, "r_y3": 456.51, "coord_origin": "TOPLEFT" }, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 477.37, "r_x1": 286.36, "r_y1": 477.37, "r_x2": 286.36, "r_y2": 468.46, "r_x3": 70.04, "r_y3": 468.46, "coord_origin": "TOPLEFT" }, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 489.32, "r_x1": 99.64, "r_y1": 489.32, "r_x2": 99.64, "r_y2": 480.42, "r_x3": 70.04, "r_y3": 480.42, "coord_origin": "TOPLEFT" }, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 511.06, "r_x1": 71.62, "r_y1": 511.06, "r_x2": 71.62, "r_y2": 502.15, "r_x3": 61.57, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.13, "r_y0": 511.06, "r_x1": 196.1, "r_y1": 511.06, "r_x2": 196.1, "r_y2": 502.15, "r_x3": 74.13, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "Across all benchmark datasets", "orig": "Across all benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.03, "r_x3": 200.31, "r_y3": 502.03, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.35, "r_y0": 511.06, "r_x1": 286.36, "r_y1": 511.06, "r_x2": 286.36, "r_y2": 502.15, "r_x3": 260.35, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 523.01, "r_x1": 286.36, "r_y1": 523.01, "r_x2": 286.36, "r_y2": 514.11, "r_x3": 70.04, "r_y3": 514.11, "coord_origin": "TOPLEFT" }, "text": "icantly outperforms existing state-of-the-art metrics,", "orig": "icantly outperforms existing state-of-the-art metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 534.97, "r_x1": 286.36, "r_y1": 534.97, "r_x2": 286.36, "r_y2": 526.06, "r_x3": 70.04, "r_y3": 526.06, "coord_origin": "TOPLEFT" }, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 546.93, "r_x1": 161.65, "r_y1": 546.93, "r_x2": 161.65, "r_y2": 538.02, "r_x3": 70.04, "r_y3": 538.02, "coord_origin": "TOPLEFT" }, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 568.66, "r_x1": 71.12, "r_y1": 568.66, "r_x2": 71.12, "r_y2": 559.76, "r_x3": 61.57, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.5, "r_y0": 568.66, "r_x1": 116.71, "r_y1": 568.66, "r_x2": 116.71, "r_y2": 559.76, "r_x3": 73.5, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 121.58, "r_y0": 568.59, "r_x1": 177.68, "r_y1": 568.59, "r_x2": 177.68, "r_y2": 559.64, "r_x3": 121.58, "r_y3": 559.64, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.55, "r_y0": 568.66, "r_x1": 286.36, "r_y1": 568.66, "r_x2": 286.36, "r_y2": 559.76, "r_x3": 182.55, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "a synthetically generated", "orig": "a synthetically generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 580.62, "r_x1": 286.36, "r_y1": 580.62, "r_x2": 286.36, "r_y2": 571.71, "r_x3": 70.04, "r_y3": 571.71, "coord_origin": "TOPLEFT" }, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 592.57, "r_x1": 82.4, "r_y1": 592.57, "r_x2": 82.4, "r_y2": 583.67, "r_x3": 70.04, "r_y3": 583.67, "coord_origin": "TOPLEFT" }, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 614.31, "r_x1": 72.33, "r_y1": 614.31, "r_x2": 72.33, "r_y2": 605.4, "r_x3": 61.57, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.02, "r_y0": 614.31, "r_x1": 286.37, "r_y1": 614.31, "r_x2": 286.37, "r_y2": 605.4, "r_x3": 75.02, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "An augmented dataset based on PubTabNet [37],", "orig": "An augmented dataset based on PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 626.26, "r_x1": 286.36, "r_y1": 626.26, "r_x2": 286.36, "r_y2": 617.36, "r_x3": 70.04, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] with generated", "orig": "FinTabNet [36], and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 638.22, "r_x1": 198.06, "r_y1": 638.22, "r_x2": 198.06, "r_y2": 629.31, "r_x3": 70.04, "r_y3": 629.31, "coord_origin": "TOPLEFT" }, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 659.5, "r_x1": 286.36, "r_y1": 659.5, "r_x2": 286.36, "r_y2": 650.6, "r_x3": 62.07, "r_y3": 650.6, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In Sec. 2, we give", "orig": "The paper is structured as follows. In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 671.46, "r_x1": 286.37, "r_y1": 671.46, "r_x2": 286.37, "r_y2": 662.55, "r_x3": 50.11, "r_y3": 662.55, "coord_origin": "TOPLEFT" }, "text": "a brief overview of the current state-of-the-art. In Sec. 3,", "orig": "a brief overview of the current state-of-the-art. In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 683.41, "r_x1": 286.37, "r_y1": 683.41, "r_x2": 286.37, "r_y2": 674.51, "r_x3": 50.11, "r_y3": 674.51, "coord_origin": "TOPLEFT" }, "text": "we describe the datasets on which we train. In Sec. 4, we", "orig": "we describe the datasets on which we train. In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 695.37, "r_x1": 286.37, "r_y1": 695.37, "r_x2": 286.37, "r_y2": 686.46, "r_x3": 50.11, "r_y3": 686.46, "coord_origin": "TOPLEFT" }, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.97, "r_y0": 712.72, "r_x1": 183.73, "r_y1": 712.72, "r_x2": 183.73, "r_y2": 705.6, "r_x3": 60.97, "r_y3": 705.6, "coord_origin": "TOPLEFT" }, "text": "$^{1}$https://github.com/IBM/SynthTabNet", "orig": "$^{1}$https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 545.12, "r_y1": 84.11, "r_x2": 545.12, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 508.08, "r_y1": 108.02, "r_x2": 508.08, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 132.48, "r_x1": 315.58, "r_y1": 132.48, "r_x2": 315.58, "r_y2": 121.73, "r_x3": 308.86, "r_y3": 121.73, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.54, "r_y0": 132.48, "r_x1": 498.28, "r_y1": 132.48, "r_x2": 498.28, "r_y2": 121.73, "r_x3": 324.54, "r_y3": 121.73, "coord_origin": "TOPLEFT" }, "text": "Previous work and State of the Art", "orig": "Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 151.13, "r_x1": 545.11, "r_y1": 151.13, "r_x2": 545.11, "r_y2": 142.22, "r_x3": 320.82, "r_y3": 142.22, "coord_origin": "TOPLEFT" }, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 163.08, "r_x1": 545.12, "r_y1": 163.08, "r_x2": 545.12, "r_y2": 154.18, "r_x3": 308.86, "r_y3": 154.18, "coord_origin": "TOPLEFT" }, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 175.04, "r_x1": 522.56, "r_y1": 175.04, "r_x2": 522.56, "r_y2": 166.13, "r_x3": 308.86, "r_y3": 166.13, "coord_origin": "TOPLEFT" }, "text": "tivates many organised public challenges [6, 4, 14].", "orig": "tivates many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 175.04, "r_x1": 545.12, "r_y1": 175.04, "r_x2": 545.12, "r_y2": 166.13, "r_x3": 529.62, "r_y3": 166.13, "coord_origin": "TOPLEFT" }, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 186.99, "r_x1": 545.12, "r_y1": 186.99, "r_x2": 545.12, "r_y2": 178.09, "r_x3": 308.86, "r_y3": 178.09, "coord_origin": "TOPLEFT" }, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 198.95, "r_x1": 545.12, "r_y1": 198.95, "r_x2": 545.12, "r_y2": 190.04, "r_x3": 308.86, "r_y3": 190.04, "coord_origin": "TOPLEFT" }, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 210.9, "r_x1": 346.98, "r_y1": 210.9, "r_x2": 346.98, "r_y2": 202.0, "r_x3": 308.86, "r_y3": 202.0, "coord_origin": "TOPLEFT" }, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.87, "r_y0": 210.9, "r_x1": 545.12, "r_y1": 210.9, "r_x2": 545.12, "r_y2": 202.0, "r_x3": 354.87, "r_y3": 202.0, "coord_origin": "TOPLEFT" }, "text": "Such large variety requires a flexible method.", "orig": "Such large variety requires a flexible method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 222.86, "r_x1": 545.12, "r_y1": 222.86, "r_x2": 545.12, "r_y2": 213.95, "r_x3": 308.86, "r_y3": 213.95, "coord_origin": "TOPLEFT" }, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 234.81, "r_x1": 530.92, "r_y1": 234.81, "r_x2": 530.92, "r_y2": 225.91, "r_x3": 308.86, "r_y3": 225.91, "coord_origin": "TOPLEFT" }, "text": "ers, which can be extremely intricate and demanding.", "orig": "ers, which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.92, "r_y0": 234.81, "r_x1": 545.12, "r_y1": 234.81, "r_x2": 545.12, "r_y2": 225.91, "r_x3": 537.92, "r_y3": 225.91, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 246.77, "r_x1": 545.12, "r_y1": 246.77, "r_x2": 545.12, "r_y2": 237.86, "r_x3": 308.86, "r_y3": 237.86, "coord_origin": "TOPLEFT" }, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.72, "r_x1": 545.12, "r_y1": 258.72, "r_x2": 545.12, "r_y2": 249.82, "r_x3": 308.86, "r_y3": 249.82, "coord_origin": "TOPLEFT" }, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.68, "r_x1": 439.84, "r_y1": 270.68, "r_x2": 439.84, "r_y2": 261.77, "r_x3": 308.86, "r_y3": 261.77, "coord_origin": "TOPLEFT" }, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.44, "r_y0": 270.46, "r_x1": 452.19, "r_y1": 270.46, "r_x2": 452.19, "r_y2": 261.61, "r_x3": 444.44, "r_y3": 261.61, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.89, "r_y0": 270.46, "r_x1": 470.83, "r_y1": 270.46, "r_x2": 470.83, "r_y2": 261.61, "r_x3": 455.89, "r_y3": 261.61, "coord_origin": "TOPLEFT" }, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 470.83, "r_y0": 270.68, "r_x1": 545.12, "r_y1": 270.68, "r_x2": 545.12, "r_y2": 261.77, "r_x3": 470.83, "r_y3": 261.77, "coord_origin": "TOPLEFT" }, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.63, "r_x1": 545.12, "r_y1": 282.63, "r_x2": 545.12, "r_y2": 273.73, "r_x3": 308.86, "r_y3": 273.73, "coord_origin": "TOPLEFT" }, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.59, "r_x1": 545.12, "r_y1": 294.59, "r_x2": 545.12, "r_y2": 285.68, "r_x3": 308.86, "r_y3": 285.68, "coord_origin": "TOPLEFT" }, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 306.55, "r_x1": 545.12, "r_y1": 306.55, "r_x2": 545.12, "r_y2": 297.64, "r_x3": 308.86, "r_y3": 297.64, "coord_origin": "TOPLEFT" }, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 318.5, "r_x1": 545.12, "r_y1": 318.5, "r_x2": 545.12, "r_y2": 309.59, "r_x3": 308.86, "r_y3": 309.59, "coord_origin": "TOPLEFT" }, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 330.46, "r_x1": 425.92, "r_y1": 330.46, "r_x2": 425.92, "r_y2": 321.55, "r_x3": 308.86, "r_y3": 321.55, "coord_origin": "TOPLEFT" }, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 342.48, "r_x1": 545.11, "r_y1": 342.48, "r_x2": 545.11, "r_y2": 333.57, "r_x3": 320.82, "r_y3": 333.57, "coord_origin": "TOPLEFT" }, "text": "Before the rising popularity of deep neural networks,", "orig": "Before the rising popularity of deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 354.43, "r_x1": 545.11, "r_y1": 354.43, "r_x2": 545.11, "r_y2": 345.52, "r_x3": 308.86, "r_y3": 345.52, "coord_origin": "TOPLEFT" }, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 366.39, "r_x1": 545.12, "r_y1": 366.39, "r_x2": 545.12, "r_y2": 357.48, "r_x3": 308.86, "r_y3": 357.48, "coord_origin": "TOPLEFT" }, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 378.34, "r_x1": 545.12, "r_y1": 378.34, "r_x2": 545.12, "r_y2": 369.44, "r_x3": 308.86, "r_y3": 369.44, "coord_origin": "TOPLEFT" }, "text": "28]. Although such methods work well on constrained ta-", "orig": "28]. Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 390.3, "r_x1": 545.12, "r_y1": 390.3, "r_x2": 545.12, "r_y2": 381.39, "r_x3": 308.86, "r_y3": 381.39, "coord_origin": "TOPLEFT" }, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 402.25, "r_x1": 545.12, "r_y1": 402.25, "r_x2": 545.12, "r_y2": 393.35, "r_x3": 308.86, "r_y3": 393.35, "coord_origin": "TOPLEFT" }, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 414.21, "r_x1": 545.12, "r_y1": 414.21, "r_x2": 545.12, "r_y2": 405.3, "r_x3": 308.86, "r_y3": 405.3, "coord_origin": "TOPLEFT" }, "text": "the availability of large datasets. To the best-of-our knowl-", "orig": "the availability of large datasets. To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 426.16, "r_x1": 545.12, "r_y1": 426.16, "r_x2": 545.12, "r_y2": 417.26, "r_x3": 308.86, "r_y3": 417.26, "coord_origin": "TOPLEFT" }, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 438.12, "r_x1": 545.12, "r_y1": 438.12, "r_x2": 545.12, "r_y2": 429.21, "r_x3": 308.86, "r_y3": 429.21, "coord_origin": "TOPLEFT" }, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 450.07, "r_x1": 401.29, "r_y1": 450.07, "r_x2": 401.29, "r_y2": 441.17, "r_x3": 308.86, "r_y3": 441.17, "coord_origin": "TOPLEFT" }, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 462.02, "r_x1": 423.26, "r_y1": 462.02, "r_x2": 423.26, "r_y2": 453.07, "r_x3": 320.82, "r_y3": 453.07, "coord_origin": "TOPLEFT" }, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.27, "r_y0": 462.09, "r_x1": 545.11, "r_y1": 462.09, "r_x2": 545.11, "r_y2": 453.19, "r_x3": 423.27, "r_y3": 453.19, "coord_origin": "TOPLEFT" }, "text": ": In this type of network, one", "orig": ": In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 474.05, "r_x1": 545.12, "r_y1": 474.05, "r_x2": 545.12, "r_y2": 465.14, "r_x3": 308.86, "r_y3": 465.14, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence of tokens starting from an encoded", "orig": "predicts a sequence of tokens starting from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 486.0, "r_x1": 335.7, "r_y1": 486.0, "r_x2": 335.7, "r_y2": 477.1, "r_x3": 308.86, "r_y3": 477.1, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.85, "r_y0": 486.0, "r_x1": 545.12, "r_y1": 486.0, "r_x2": 545.12, "r_y2": 477.1, "r_x3": 345.85, "r_y3": 477.1, "coord_origin": "TOPLEFT" }, "text": "Such sequences of tokens can be HTML table", "orig": "Such sequences of tokens can be HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.96, "r_x1": 545.11, "r_y1": 497.96, "r_x2": 545.11, "r_y2": 489.05, "r_x3": 308.86, "r_y3": 489.05, "coord_origin": "TOPLEFT" }, "text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.91, "r_x1": 545.11, "r_y1": 509.91, "r_x2": 545.11, "r_y2": 501.01, "r_x3": 308.86, "r_y3": 501.01, "coord_origin": "TOPLEFT" }, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.87, "r_x1": 545.12, "r_y1": 521.87, "r_x2": 545.12, "r_y2": 512.96, "r_x3": 308.86, "r_y3": 512.96, "coord_origin": "TOPLEFT" }, "text": "formed into the other. There are however subtle variations", "orig": "formed into the other. There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.82, "r_x1": 545.12, "r_y1": 533.82, "r_x2": 545.12, "r_y2": 524.92, "r_x3": 308.86, "r_y3": 524.92, "coord_origin": "TOPLEFT" }, "text": "in the Image-to-Text networks. The easiest network archi-", "orig": "in the Image-to-Text networks. The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.78, "r_x1": 420.94, "r_y1": 545.78, "r_x2": 420.94, "r_y2": 536.87, "r_x3": 308.86, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "tectures are \u201cimage-encoder", "orig": "tectures are \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.59, "r_y0": 545.56, "r_x1": 433.56, "r_y1": 545.56, "r_x2": 433.56, "r_y2": 536.16, "r_x3": 423.59, "r_y3": 536.16, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.21, "r_y0": 545.78, "r_x1": 545.11, "r_y1": 545.78, "r_x2": 545.11, "r_y2": 536.87, "r_x3": 436.21, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "text-decoder\u201d (IETD), sim-", "orig": "text-decoder\u201d (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.73, "r_x1": 545.12, "r_y1": 557.73, "r_x2": 545.12, "r_y2": 548.83, "r_x3": 308.86, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.69, "r_x1": 545.11, "r_y1": 569.69, "r_x2": 545.11, "r_y2": 560.78, "r_x3": 308.86, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.64, "r_x1": 545.11, "r_y1": 581.64, "r_x2": 545.11, "r_y2": 572.74, "r_x3": 308.86, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "the LaTeX/HTML string of the entire table, i.e. the sym-", "orig": "the LaTeX/HTML string of the entire table, i.e. the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.6, "r_x1": 545.12, "r_y1": 593.6, "r_x2": 545.12, "r_y2": 584.69, "r_x3": 308.86, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.56, "r_x1": 497.08, "r_y1": 605.56, "r_x2": 497.08, "r_y2": 596.65, "r_x3": 308.86, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "table. Another approach is the \u201cimage-encoder", "orig": "table. Another approach is the \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.8, "r_y0": 605.34, "r_x1": 509.77, "r_y1": 605.34, "r_x2": 509.77, "r_y2": 595.93, "r_x3": 499.8, "r_y3": 595.93, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.5, "r_y0": 605.56, "r_x1": 545.11, "r_y1": 605.56, "r_x2": 545.11, "r_y2": 596.65, "r_x3": 512.5, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.51, "r_x1": 545.12, "r_y1": 617.51, "r_x2": 545.12, "r_y2": 608.6, "r_x3": 308.86, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "coder\u201d (IEDD) networks. In these type of networks, one has", "orig": "coder\u201d (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.47, "r_x1": 545.12, "r_y1": 629.47, "r_x2": 545.12, "r_y2": 620.56, "r_x3": 308.86, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.42, "r_x1": 364.78, "r_y1": 641.42, "r_x2": 364.78, "r_y2": 632.51, "r_x3": 308.86, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.57, "r_y0": 641.19, "r_x1": 415.61, "r_y1": 641.19, "r_x2": 415.61, "r_y2": 632.6, "r_x3": 367.57, "r_y3": 632.6, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.61, "r_y0": 641.42, "r_x1": 545.12, "r_y1": 641.42, "r_x2": 545.12, "r_y2": 632.51, "r_x3": 415.61, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": ", i.e. it only produces the HTM-", "orig": ", i.e. it only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.38, "r_x1": 545.12, "r_y1": 653.38, "r_x2": 545.12, "r_y2": 644.47, "r_x3": 308.86, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.1, "r_x1": 373.6, "r_y1": 665.1, "r_x2": 373.6, "r_y2": 656.51, "r_x3": 308.86, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.91, "r_y0": 665.33, "r_x1": 545.12, "r_y1": 665.33, "r_x2": 545.12, "r_y2": 656.43, "r_x3": 376.91, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.12, "r_y1": 677.29, "r_x2": 545.12, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.01, "r_x1": 356.9, "r_y1": 689.01, "r_x2": 356.9, "r_y2": 680.42, "r_x3": 308.86, "r_y3": 680.42, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.13, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 357.13, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": ") to generate the textual content of each table", "orig": ") to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "cell. The network architecture of IEDD is certainly more", "orig": "cell. The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 12, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 96.07, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 112.65, "r_y1": 96.07, "r_x2": 112.65, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 99.57, "r": 286.37, "b": 228.03, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 108.48, "r_x1": 286.36, "r_y1": 108.48, "r_x2": 286.36, "r_y2": 99.57, "r_x3": 62.07, "r_y3": 99.57, "coord_origin": "TOPLEFT" }, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 120.43, "r_x1": 74.75, "r_y1": 120.43, "r_x2": 74.75, "r_y2": 111.53, "r_x3": 50.11, "r_y3": 111.53, "coord_origin": "TOPLEFT" }, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.33, "r_y0": 120.43, "r_x1": 286.37, "r_y1": 120.43, "r_x2": 286.37, "r_y2": 111.53, "r_x3": 81.33, "r_y3": 111.53, "coord_origin": "TOPLEFT" }, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 132.39, "r_x1": 286.37, "r_y1": 132.39, "r_x2": 286.37, "r_y2": 123.48, "r_x3": 50.11, "r_y3": 123.48, "coord_origin": "TOPLEFT" }, "text": "munity of document understanding [6, 4, 14]. Contrary to", "orig": "munity of document understanding [6, 4, 14]. Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 144.34, "r_x1": 286.37, "r_y1": 144.34, "r_x2": 286.37, "r_y2": 135.44, "r_x3": 50.11, "r_y3": 135.44, "coord_origin": "TOPLEFT" }, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 156.3, "r_x1": 286.37, "r_y1": 156.3, "r_x2": 286.37, "r_y2": 147.39, "r_x3": 50.11, "r_y3": 147.39, "coord_origin": "TOPLEFT" }, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 168.25, "r_x1": 286.37, "r_y1": 168.25, "r_x2": 286.37, "r_y2": 159.35, "r_x3": 50.11, "r_y3": 159.35, "coord_origin": "TOPLEFT" }, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 180.21, "r_x1": 286.37, "r_y1": 180.21, "r_x2": 286.37, "r_y2": 171.3, "r_x3": 50.11, "r_y3": 171.3, "coord_origin": "TOPLEFT" }, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 192.16, "r_x1": 286.37, "r_y1": 192.16, "r_x2": 286.37, "r_y2": 183.26, "r_x3": 50.11, "r_y3": 183.26, "coord_origin": "TOPLEFT" }, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 204.12, "r_x1": 286.37, "r_y1": 204.12, "r_x2": 286.37, "r_y2": 195.21, "r_x3": 50.11, "r_y3": 195.21, "coord_origin": "TOPLEFT" }, "text": "nesses (see Sec. 2). The common denominator here is the", "orig": "nesses (see Sec. 2). The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 216.07, "r_x1": 286.37, "r_y1": 216.07, "r_x2": 286.37, "r_y2": 207.17, "r_x3": 50.11, "r_y3": 207.17, "coord_origin": "TOPLEFT" }, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 228.03, "r_x1": 278.66, "r_y1": 228.03, "r_x2": 278.66, "r_y2": 219.12, "r_x3": 50.11, "r_y3": 219.12, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 231.53, "r": 286.37, "b": 371.95, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 240.44, "r_x1": 286.36, "r_y1": 240.44, "r_x2": 286.36, "r_y2": 231.53, "r_x3": 62.07, "r_y3": 231.53, "coord_origin": "TOPLEFT" }, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 252.39, "r_x1": 286.37, "r_y1": 252.39, "r_x2": 286.37, "r_y2": 243.49, "r_x3": 50.11, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "present a robust table-structure decomposition algorithm.", "orig": "present a robust table-structure decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.35, "r_x1": 286.37, "r_y1": 264.35, "r_x2": 286.37, "r_y2": 255.44, "r_x3": 50.11, "r_y3": 255.44, "coord_origin": "TOPLEFT" }, "text": "The design criteria for our model are the following. First,", "orig": "The design criteria for our model are the following. First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.3, "r_x1": 286.37, "r_y1": 276.3, "r_x2": 286.37, "r_y2": 267.4, "r_x3": 50.11, "r_y3": 267.4, "coord_origin": "TOPLEFT" }, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.26, "r_x1": 286.37, "r_y1": 288.26, "r_x2": 286.37, "r_y2": 279.35, "r_x3": 50.11, "r_y3": 279.35, "coord_origin": "TOPLEFT" }, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.21, "r_x1": 88.57, "r_y1": 300.21, "r_x2": 88.57, "r_y2": 291.31, "r_x3": 50.11, "r_y3": 291.31, "coord_origin": "TOPLEFT" }, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 95.5, "r_y0": 300.21, "r_x1": 286.37, "r_y1": 300.21, "r_x2": 286.37, "r_y2": 291.31, "r_x3": 95.5, "r_y3": 291.31, "coord_origin": "TOPLEFT" }, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.17, "r_x1": 286.37, "r_y1": 312.17, "r_x2": 286.37, "r_y2": 303.26, "r_x3": 50.11, "r_y3": 303.26, "coord_origin": "TOPLEFT" }, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.12, "r_x1": 286.37, "r_y1": 324.12, "r_x2": 286.37, "r_y2": 315.22, "r_x3": 50.11, "r_y3": 315.22, "coord_origin": "TOPLEFT" }, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.08, "r_x1": 286.37, "r_y1": 336.08, "r_x2": 286.37, "r_y2": 327.17, "r_x3": 50.11, "r_y3": 327.17, "coord_origin": "TOPLEFT" }, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.03, "r_x1": 286.37, "r_y1": 348.03, "r_x2": 286.37, "r_y2": 339.13, "r_x3": 50.11, "r_y3": 339.13, "coord_origin": "TOPLEFT" }, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.99, "r_x1": 286.37, "r_y1": 359.99, "r_x2": 286.37, "r_y2": 351.08, "r_x3": 50.11, "r_y3": 351.08, "coord_origin": "TOPLEFT" }, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.95, "r_x1": 76.95, "r_y1": 371.95, "r_x2": 76.95, "r_y2": 363.04, "r_x3": 50.11, "r_y3": 363.04, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 375.45, "r": 286.37, "b": 432.17, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 384.35, "r_x1": 286.36, "r_y1": 384.35, "r_x2": 286.36, "r_y2": 375.45, "r_x3": 62.07, "r_y3": 375.45, "coord_origin": "TOPLEFT" }, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.31, "r_x1": 120.99, "r_y1": 396.31, "r_x2": 120.99, "r_y2": 387.4, "r_x3": 50.11, "r_y3": 387.4, "coord_origin": "TOPLEFT" }, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 123.9, "r_y0": 396.24, "r_x1": 179.73, "r_y1": 396.24, "r_x2": 179.73, "r_y2": 387.28, "r_x3": 123.9, "r_y3": 387.28, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.65, "r_y0": 396.31, "r_x1": 286.37, "r_y1": 396.31, "r_x2": 286.37, "r_y2": 387.4, "r_x3": 182.65, "r_y3": 387.4, "coord_origin": "TOPLEFT" }, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 408.26, "r_x1": 181.76, "r_y1": 408.26, "r_x2": 181.76, "r_y2": 399.36, "r_x3": 50.11, "r_y3": 399.36, "coord_origin": "TOPLEFT" }, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.1, "r_y0": 408.19, "r_x1": 240.2, "r_y1": 408.19, "r_x2": 240.2, "r_y2": 399.24, "r_x3": 184.1, "r_y3": 399.24, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.2, "r_y0": 408.26, "r_x1": 286.36, "r_y1": 408.26, "r_x2": 286.36, "r_y2": 399.36, "r_x3": 240.2, "r_y3": 399.36, "coord_origin": "TOPLEFT" }, "text": "$^{1}$. In partic-", "orig": "$^{1}$. In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 420.22, "r_x1": 286.37, "r_y1": 420.22, "r_x2": 286.37, "r_y2": 411.31, "r_x3": 50.11, "r_y3": 411.31, "coord_origin": "TOPLEFT" }, "text": "ular, our contributions in this work can be summarised as", "orig": "ular, our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 432.17, "r_x1": 82.52, "r_y1": 432.17, "r_x2": 82.52, "r_y2": 423.27, "r_x3": 50.11, "r_y3": 423.27, "coord_origin": "TOPLEFT" }, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 61.57, "t": 444.43, "r": 286.36, "b": 489.32, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 453.46, "r_x1": 70.74, "r_y1": 453.46, "r_x2": 70.74, "r_y2": 444.55, "r_x3": 61.57, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.03, "r_y0": 453.46, "r_x1": 117.1, "r_y1": 453.46, "r_x2": 117.1, "r_y2": 444.55, "r_x3": 73.03, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.59, "r_y0": 453.39, "r_x1": 175.42, "r_y1": 453.39, "r_x2": 175.42, "r_y2": 444.43, "r_x3": 119.59, "r_y3": 444.43, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.42, "r_y0": 453.46, "r_x1": 286.36, "r_y1": 453.46, "r_x2": 286.36, "r_y2": 444.55, "r_x3": 175.42, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 465.41, "r_x1": 286.36, "r_y1": 465.41, "r_x2": 286.36, "r_y2": 456.51, "r_x3": 70.04, "r_y3": 456.51, "coord_origin": "TOPLEFT" }, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 477.37, "r_x1": 286.36, "r_y1": 477.37, "r_x2": 286.36, "r_y2": 468.46, "r_x3": 70.04, "r_y3": 468.46, "coord_origin": "TOPLEFT" }, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 489.32, "r_x1": 99.64, "r_y1": 489.32, "r_x2": 99.64, "r_y2": 480.42, "r_x3": 70.04, "r_y3": 480.42, "coord_origin": "TOPLEFT" }, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 61.57, "t": 502.03, "r": 286.36, "b": 546.93, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 511.06, "r_x1": 71.62, "r_y1": 511.06, "r_x2": 71.62, "r_y2": 502.15, "r_x3": 61.57, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.13, "r_y0": 511.06, "r_x1": 196.1, "r_y1": 511.06, "r_x2": 196.1, "r_y2": 502.15, "r_x3": 74.13, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "Across all benchmark datasets", "orig": "Across all benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.03, "r_x3": 200.31, "r_y3": 502.03, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.35, "r_y0": 511.06, "r_x1": 286.36, "r_y1": 511.06, "r_x2": 286.36, "r_y2": 502.15, "r_x3": 260.35, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 523.01, "r_x1": 286.36, "r_y1": 523.01, "r_x2": 286.36, "r_y2": 514.11, "r_x3": 70.04, "r_y3": 514.11, "coord_origin": "TOPLEFT" }, "text": "icantly outperforms existing state-of-the-art metrics,", "orig": "icantly outperforms existing state-of-the-art metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 534.97, "r_x1": 286.36, "r_y1": 534.97, "r_x2": 286.36, "r_y2": 526.06, "r_x3": 70.04, "r_y3": 526.06, "coord_origin": "TOPLEFT" }, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 546.93, "r_x1": 161.65, "r_y1": 546.93, "r_x2": 161.65, "r_y2": 538.02, "r_x3": 70.04, "r_y3": 538.02, "coord_origin": "TOPLEFT" }, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 61.57, "t": 559.64, "r": 286.36, "b": 592.57, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 568.66, "r_x1": 71.12, "r_y1": 568.66, "r_x2": 71.12, "r_y2": 559.76, "r_x3": 61.57, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.5, "r_y0": 568.66, "r_x1": 116.71, "r_y1": 568.66, "r_x2": 116.71, "r_y2": 559.76, "r_x3": 73.5, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 121.58, "r_y0": 568.59, "r_x1": 177.68, "r_y1": 568.59, "r_x2": 177.68, "r_y2": 559.64, "r_x3": 121.58, "r_y3": 559.64, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.55, "r_y0": 568.66, "r_x1": 286.36, "r_y1": 568.66, "r_x2": 286.36, "r_y2": 559.76, "r_x3": 182.55, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "a synthetically generated", "orig": "a synthetically generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 580.62, "r_x1": 286.36, "r_y1": 580.62, "r_x2": 286.36, "r_y2": 571.71, "r_x3": 70.04, "r_y3": 571.71, "coord_origin": "TOPLEFT" }, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 592.57, "r_x1": 82.4, "r_y1": 592.57, "r_x2": 82.4, "r_y2": 583.67, "r_x3": 70.04, "r_y3": 583.67, "coord_origin": "TOPLEFT" }, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 61.57, "t": 605.4, "r": 286.37, "b": 638.22, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 614.31, "r_x1": 72.33, "r_y1": 614.31, "r_x2": 72.33, "r_y2": 605.4, "r_x3": 61.57, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.02, "r_y0": 614.31, "r_x1": 286.37, "r_y1": 614.31, "r_x2": 286.37, "r_y2": 605.4, "r_x3": 75.02, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "An augmented dataset based on PubTabNet [37],", "orig": "An augmented dataset based on PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 626.26, "r_x1": 286.36, "r_y1": 626.26, "r_x2": 286.36, "r_y2": 617.36, "r_x3": 70.04, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] with generated", "orig": "FinTabNet [36], and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 638.22, "r_x1": 198.06, "r_y1": 638.22, "r_x2": 198.06, "r_y2": 629.31, "r_x3": 70.04, "r_y3": 629.31, "coord_origin": "TOPLEFT" }, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 650.6, "r": 286.37, "b": 695.37, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 659.5, "r_x1": 286.36, "r_y1": 659.5, "r_x2": 286.36, "r_y2": 650.6, "r_x3": 62.07, "r_y3": 650.6, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In Sec. 2, we give", "orig": "The paper is structured as follows. In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 671.46, "r_x1": 286.37, "r_y1": 671.46, "r_x2": 286.37, "r_y2": 662.55, "r_x3": 50.11, "r_y3": 662.55, "coord_origin": "TOPLEFT" }, "text": "a brief overview of the current state-of-the-art. In Sec. 3,", "orig": "a brief overview of the current state-of-the-art. In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 683.41, "r_x1": 286.37, "r_y1": 683.41, "r_x2": 286.37, "r_y2": 674.51, "r_x3": 50.11, "r_y3": 674.51, "coord_origin": "TOPLEFT" }, "text": "we describe the datasets on which we train. In Sec. 4, we", "orig": "we describe the datasets on which we train. In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 695.37, "r_x1": 286.37, "r_y1": 695.37, "r_x2": 286.37, "r_y2": 686.46, "r_x3": 50.11, "r_y3": 686.46, "coord_origin": "TOPLEFT" }, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "footnote", "bbox": { "l": 60.97, "t": 705.6, "r": 183.73, "b": 712.72, "coord_origin": "TOPLEFT" }, "confidence": 0.895, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.97, "r_y0": 712.72, "r_x1": 183.73, "r_y1": 712.72, "r_x2": 183.73, "r_y2": 705.6, "r_x3": 60.97, "r_y3": 705.6, "coord_origin": "TOPLEFT" }, "text": "$^{1}$https://github.com/IBM/SynthTabNet", "orig": "$^{1}$https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.977, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 545.12, "r_y1": 84.11, "r_x2": 545.12, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 508.08, "r_y1": 108.02, "r_x2": 508.08, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "section_header", "bbox": { "l": 308.86, "t": 121.73, "r": 498.28, "b": 132.48, "coord_origin": "TOPLEFT" }, "confidence": 0.943, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 132.48, "r_x1": 315.58, "r_y1": 132.48, "r_x2": 315.58, "r_y2": 121.73, "r_x3": 308.86, "r_y3": 121.73, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.54, "r_y0": 132.48, "r_x1": 498.28, "r_y1": 132.48, "r_x2": 498.28, "r_y2": 121.73, "r_x3": 324.54, "r_y3": 121.73, "coord_origin": "TOPLEFT" }, "text": "Previous work and State of the Art", "orig": "Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 142.22, "r": 545.12, "b": 330.46, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 151.13, "r_x1": 545.11, "r_y1": 151.13, "r_x2": 545.11, "r_y2": 142.22, "r_x3": 320.82, "r_y3": 142.22, "coord_origin": "TOPLEFT" }, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 163.08, "r_x1": 545.12, "r_y1": 163.08, "r_x2": 545.12, "r_y2": 154.18, "r_x3": 308.86, "r_y3": 154.18, "coord_origin": "TOPLEFT" }, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 175.04, "r_x1": 522.56, "r_y1": 175.04, "r_x2": 522.56, "r_y2": 166.13, "r_x3": 308.86, "r_y3": 166.13, "coord_origin": "TOPLEFT" }, "text": "tivates many organised public challenges [6, 4, 14].", "orig": "tivates many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 175.04, "r_x1": 545.12, "r_y1": 175.04, "r_x2": 545.12, "r_y2": 166.13, "r_x3": 529.62, "r_y3": 166.13, "coord_origin": "TOPLEFT" }, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 186.99, "r_x1": 545.12, "r_y1": 186.99, "r_x2": 545.12, "r_y2": 178.09, "r_x3": 308.86, "r_y3": 178.09, "coord_origin": "TOPLEFT" }, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 198.95, "r_x1": 545.12, "r_y1": 198.95, "r_x2": 545.12, "r_y2": 190.04, "r_x3": 308.86, "r_y3": 190.04, "coord_origin": "TOPLEFT" }, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 210.9, "r_x1": 346.98, "r_y1": 210.9, "r_x2": 346.98, "r_y2": 202.0, "r_x3": 308.86, "r_y3": 202.0, "coord_origin": "TOPLEFT" }, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.87, "r_y0": 210.9, "r_x1": 545.12, "r_y1": 210.9, "r_x2": 545.12, "r_y2": 202.0, "r_x3": 354.87, "r_y3": 202.0, "coord_origin": "TOPLEFT" }, "text": "Such large variety requires a flexible method.", "orig": "Such large variety requires a flexible method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 222.86, "r_x1": 545.12, "r_y1": 222.86, "r_x2": 545.12, "r_y2": 213.95, "r_x3": 308.86, "r_y3": 213.95, "coord_origin": "TOPLEFT" }, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 234.81, "r_x1": 530.92, "r_y1": 234.81, "r_x2": 530.92, "r_y2": 225.91, "r_x3": 308.86, "r_y3": 225.91, "coord_origin": "TOPLEFT" }, "text": "ers, which can be extremely intricate and demanding.", "orig": "ers, which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.92, "r_y0": 234.81, "r_x1": 545.12, "r_y1": 234.81, "r_x2": 545.12, "r_y2": 225.91, "r_x3": 537.92, "r_y3": 225.91, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 246.77, "r_x1": 545.12, "r_y1": 246.77, "r_x2": 545.12, "r_y2": 237.86, "r_x3": 308.86, "r_y3": 237.86, "coord_origin": "TOPLEFT" }, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.72, "r_x1": 545.12, "r_y1": 258.72, "r_x2": 545.12, "r_y2": 249.82, "r_x3": 308.86, "r_y3": 249.82, "coord_origin": "TOPLEFT" }, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.68, "r_x1": 439.84, "r_y1": 270.68, "r_x2": 439.84, "r_y2": 261.77, "r_x3": 308.86, "r_y3": 261.77, "coord_origin": "TOPLEFT" }, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.44, "r_y0": 270.46, "r_x1": 452.19, "r_y1": 270.46, "r_x2": 452.19, "r_y2": 261.61, "r_x3": 444.44, "r_y3": 261.61, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.89, "r_y0": 270.46, "r_x1": 470.83, "r_y1": 270.46, "r_x2": 470.83, "r_y2": 261.61, "r_x3": 455.89, "r_y3": 261.61, "coord_origin": "TOPLEFT" }, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 470.83, "r_y0": 270.68, "r_x1": 545.12, "r_y1": 270.68, "r_x2": 545.12, "r_y2": 261.77, "r_x3": 470.83, "r_y3": 261.77, "coord_origin": "TOPLEFT" }, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.63, "r_x1": 545.12, "r_y1": 282.63, "r_x2": 545.12, "r_y2": 273.73, "r_x3": 308.86, "r_y3": 273.73, "coord_origin": "TOPLEFT" }, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.59, "r_x1": 545.12, "r_y1": 294.59, "r_x2": 545.12, "r_y2": 285.68, "r_x3": 308.86, "r_y3": 285.68, "coord_origin": "TOPLEFT" }, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 306.55, "r_x1": 545.12, "r_y1": 306.55, "r_x2": 545.12, "r_y2": 297.64, "r_x3": 308.86, "r_y3": 297.64, "coord_origin": "TOPLEFT" }, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 318.5, "r_x1": 545.12, "r_y1": 318.5, "r_x2": 545.12, "r_y2": 309.59, "r_x3": 308.86, "r_y3": 309.59, "coord_origin": "TOPLEFT" }, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 330.46, "r_x1": 425.92, "r_y1": 330.46, "r_x2": 425.92, "r_y2": 321.55, "r_x3": 308.86, "r_y3": 321.55, "coord_origin": "TOPLEFT" }, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 333.57, "r": 545.12, "b": 450.07, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 342.48, "r_x1": 545.11, "r_y1": 342.48, "r_x2": 545.11, "r_y2": 333.57, "r_x3": 320.82, "r_y3": 333.57, "coord_origin": "TOPLEFT" }, "text": "Before the rising popularity of deep neural networks,", "orig": "Before the rising popularity of deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 354.43, "r_x1": 545.11, "r_y1": 354.43, "r_x2": 545.11, "r_y2": 345.52, "r_x3": 308.86, "r_y3": 345.52, "coord_origin": "TOPLEFT" }, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 366.39, "r_x1": 545.12, "r_y1": 366.39, "r_x2": 545.12, "r_y2": 357.48, "r_x3": 308.86, "r_y3": 357.48, "coord_origin": "TOPLEFT" }, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 378.34, "r_x1": 545.12, "r_y1": 378.34, "r_x2": 545.12, "r_y2": 369.44, "r_x3": 308.86, "r_y3": 369.44, "coord_origin": "TOPLEFT" }, "text": "28]. Although such methods work well on constrained ta-", "orig": "28]. Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 390.3, "r_x1": 545.12, "r_y1": 390.3, "r_x2": 545.12, "r_y2": 381.39, "r_x3": 308.86, "r_y3": 381.39, "coord_origin": "TOPLEFT" }, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 402.25, "r_x1": 545.12, "r_y1": 402.25, "r_x2": 545.12, "r_y2": 393.35, "r_x3": 308.86, "r_y3": 393.35, "coord_origin": "TOPLEFT" }, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 414.21, "r_x1": 545.12, "r_y1": 414.21, "r_x2": 545.12, "r_y2": 405.3, "r_x3": 308.86, "r_y3": 405.3, "coord_origin": "TOPLEFT" }, "text": "the availability of large datasets. To the best-of-our knowl-", "orig": "the availability of large datasets. To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 426.16, "r_x1": 545.12, "r_y1": 426.16, "r_x2": 545.12, "r_y2": 417.26, "r_x3": 308.86, "r_y3": 417.26, "coord_origin": "TOPLEFT" }, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 438.12, "r_x1": 545.12, "r_y1": 438.12, "r_x2": 545.12, "r_y2": 429.21, "r_x3": 308.86, "r_y3": 429.21, "coord_origin": "TOPLEFT" }, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 450.07, "r_x1": 401.29, "r_y1": 450.07, "r_x2": 401.29, "r_y2": 441.17, "r_x3": 308.86, "r_y3": 441.17, "coord_origin": "TOPLEFT" }, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 453.07, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 462.02, "r_x1": 423.26, "r_y1": 462.02, "r_x2": 423.26, "r_y2": 453.07, "r_x3": 320.82, "r_y3": 453.07, "coord_origin": "TOPLEFT" }, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.27, "r_y0": 462.09, "r_x1": 545.11, "r_y1": 462.09, "r_x2": 545.11, "r_y2": 453.19, "r_x3": 423.27, "r_y3": 453.19, "coord_origin": "TOPLEFT" }, "text": ": In this type of network, one", "orig": ": In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 474.05, "r_x1": 545.12, "r_y1": 474.05, "r_x2": 545.12, "r_y2": 465.14, "r_x3": 308.86, "r_y3": 465.14, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence of tokens starting from an encoded", "orig": "predicts a sequence of tokens starting from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 486.0, "r_x1": 335.7, "r_y1": 486.0, "r_x2": 335.7, "r_y2": 477.1, "r_x3": 308.86, "r_y3": 477.1, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.85, "r_y0": 486.0, "r_x1": 545.12, "r_y1": 486.0, "r_x2": 545.12, "r_y2": 477.1, "r_x3": 345.85, "r_y3": 477.1, "coord_origin": "TOPLEFT" }, "text": "Such sequences of tokens can be HTML table", "orig": "Such sequences of tokens can be HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.96, "r_x1": 545.11, "r_y1": 497.96, "r_x2": 545.11, "r_y2": 489.05, "r_x3": 308.86, "r_y3": 489.05, "coord_origin": "TOPLEFT" }, "text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.91, "r_x1": 545.11, "r_y1": 509.91, "r_x2": 545.11, "r_y2": 501.01, "r_x3": 308.86, "r_y3": 501.01, "coord_origin": "TOPLEFT" }, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.87, "r_x1": 545.12, "r_y1": 521.87, "r_x2": 545.12, "r_y2": 512.96, "r_x3": 308.86, "r_y3": 512.96, "coord_origin": "TOPLEFT" }, "text": "formed into the other. There are however subtle variations", "orig": "formed into the other. There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.82, "r_x1": 545.12, "r_y1": 533.82, "r_x2": 545.12, "r_y2": 524.92, "r_x3": 308.86, "r_y3": 524.92, "coord_origin": "TOPLEFT" }, "text": "in the Image-to-Text networks. The easiest network archi-", "orig": "in the Image-to-Text networks. The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.78, "r_x1": 420.94, "r_y1": 545.78, "r_x2": 420.94, "r_y2": 536.87, "r_x3": 308.86, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "tectures are \u201cimage-encoder", "orig": "tectures are \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.59, "r_y0": 545.56, "r_x1": 433.56, "r_y1": 545.56, "r_x2": 433.56, "r_y2": 536.16, "r_x3": 423.59, "r_y3": 536.16, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.21, "r_y0": 545.78, "r_x1": 545.11, "r_y1": 545.78, "r_x2": 545.11, "r_y2": 536.87, "r_x3": 436.21, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "text-decoder\u201d (IETD), sim-", "orig": "text-decoder\u201d (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.73, "r_x1": 545.12, "r_y1": 557.73, "r_x2": 545.12, "r_y2": 548.83, "r_x3": 308.86, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.69, "r_x1": 545.11, "r_y1": 569.69, "r_x2": 545.11, "r_y2": 560.78, "r_x3": 308.86, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.64, "r_x1": 545.11, "r_y1": 581.64, "r_x2": 545.11, "r_y2": 572.74, "r_x3": 308.86, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "the LaTeX/HTML string of the entire table, i.e. the sym-", "orig": "the LaTeX/HTML string of the entire table, i.e. the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.6, "r_x1": 545.12, "r_y1": 593.6, "r_x2": 545.12, "r_y2": 584.69, "r_x3": 308.86, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.56, "r_x1": 497.08, "r_y1": 605.56, "r_x2": 497.08, "r_y2": 596.65, "r_x3": 308.86, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "table. Another approach is the \u201cimage-encoder", "orig": "table. Another approach is the \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.8, "r_y0": 605.34, "r_x1": 509.77, "r_y1": 605.34, "r_x2": 509.77, "r_y2": 595.93, "r_x3": 499.8, "r_y3": 595.93, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.5, "r_y0": 605.56, "r_x1": 545.11, "r_y1": 605.56, "r_x2": 545.11, "r_y2": 596.65, "r_x3": 512.5, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.51, "r_x1": 545.12, "r_y1": 617.51, "r_x2": 545.12, "r_y2": 608.6, "r_x3": 308.86, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "coder\u201d (IEDD) networks. In these type of networks, one has", "orig": "coder\u201d (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.47, "r_x1": 545.12, "r_y1": 629.47, "r_x2": 545.12, "r_y2": 620.56, "r_x3": 308.86, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.42, "r_x1": 364.78, "r_y1": 641.42, "r_x2": 364.78, "r_y2": 632.51, "r_x3": 308.86, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.57, "r_y0": 641.19, "r_x1": 415.61, "r_y1": 641.19, "r_x2": 415.61, "r_y2": 632.6, "r_x3": 367.57, "r_y3": 632.6, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.61, "r_y0": 641.42, "r_x1": 545.12, "r_y1": 641.42, "r_x2": 545.12, "r_y2": 632.51, "r_x3": 415.61, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": ", i.e. it only produces the HTM-", "orig": ", i.e. it only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.38, "r_x1": 545.12, "r_y1": 653.38, "r_x2": 545.12, "r_y2": 644.47, "r_x3": 308.86, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.1, "r_x1": 373.6, "r_y1": 665.1, "r_x2": 373.6, "r_y2": 656.51, "r_x3": 308.86, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.91, "r_y0": 665.33, "r_x1": 545.12, "r_y1": 665.33, "r_x2": 545.12, "r_y2": 656.43, "r_x3": 376.91, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.12, "r_y1": 677.29, "r_x2": 545.12, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.01, "r_x1": 356.9, "r_y1": 689.01, "r_x2": 356.9, "r_y2": 680.42, "r_x3": 308.86, "r_y3": 680.42, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.13, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 357.13, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": ") to generate the textual content of each table", "orig": ") to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "cell. The network architecture of IEDD is certainly more", "orig": "cell. The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.878, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 12, "page_no": 1, "cluster": { "id": 12, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 96.07, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 112.65, "r_y1": 96.07, "r_x2": 112.65, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "considered as a solved problem, given enough ground-truth data to train on." }, { "label": "text", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 99.57, "r": 286.37, "b": 228.03, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 108.48, "r_x1": 286.36, "r_y1": 108.48, "r_x2": 286.36, "r_y2": 99.57, "r_x3": 62.07, "r_y3": 99.57, "coord_origin": "TOPLEFT" }, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 120.43, "r_x1": 74.75, "r_y1": 120.43, "r_x2": 74.75, "r_y2": 111.53, "r_x3": 50.11, "r_y3": 111.53, "coord_origin": "TOPLEFT" }, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.33, "r_y0": 120.43, "r_x1": 286.37, "r_y1": 120.43, "r_x2": 286.37, "r_y2": 111.53, "r_x3": 81.33, "r_y3": 111.53, "coord_origin": "TOPLEFT" }, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 132.39, "r_x1": 286.37, "r_y1": 132.39, "r_x2": 286.37, "r_y2": 123.48, "r_x3": 50.11, "r_y3": 123.48, "coord_origin": "TOPLEFT" }, "text": "munity of document understanding [6, 4, 14]. Contrary to", "orig": "munity of document understanding [6, 4, 14]. Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 144.34, "r_x1": 286.37, "r_y1": 144.34, "r_x2": 286.37, "r_y2": 135.44, "r_x3": 50.11, "r_y3": 135.44, "coord_origin": "TOPLEFT" }, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 156.3, "r_x1": 286.37, "r_y1": 156.3, "r_x2": 286.37, "r_y2": 147.39, "r_x3": 50.11, "r_y3": 147.39, "coord_origin": "TOPLEFT" }, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 168.25, "r_x1": 286.37, "r_y1": 168.25, "r_x2": 286.37, "r_y2": 159.35, "r_x3": 50.11, "r_y3": 159.35, "coord_origin": "TOPLEFT" }, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 180.21, "r_x1": 286.37, "r_y1": 180.21, "r_x2": 286.37, "r_y2": 171.3, "r_x3": 50.11, "r_y3": 171.3, "coord_origin": "TOPLEFT" }, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 192.16, "r_x1": 286.37, "r_y1": 192.16, "r_x2": 286.37, "r_y2": 183.26, "r_x3": 50.11, "r_y3": 183.26, "coord_origin": "TOPLEFT" }, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 204.12, "r_x1": 286.37, "r_y1": 204.12, "r_x2": 286.37, "r_y2": 195.21, "r_x3": 50.11, "r_y3": 195.21, "coord_origin": "TOPLEFT" }, "text": "nesses (see Sec. 2). The common denominator here is the", "orig": "nesses (see Sec. 2). The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 216.07, "r_x1": 286.37, "r_y1": 216.07, "r_x2": 286.37, "r_y2": 207.17, "r_x3": 50.11, "r_y3": 207.17, "coord_origin": "TOPLEFT" }, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 228.03, "r_x1": 278.66, "r_y1": 228.03, "r_x2": 278.66, "r_y2": 219.12, "r_x3": 50.11, "r_y3": 219.12, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image." }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 231.53, "r": 286.37, "b": 371.95, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 240.44, "r_x1": 286.36, "r_y1": 240.44, "r_x2": 286.36, "r_y2": 231.53, "r_x3": 62.07, "r_y3": 231.53, "coord_origin": "TOPLEFT" }, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 252.39, "r_x1": 286.37, "r_y1": 252.39, "r_x2": 286.37, "r_y2": 243.49, "r_x3": 50.11, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "present a robust table-structure decomposition algorithm.", "orig": "present a robust table-structure decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.35, "r_x1": 286.37, "r_y1": 264.35, "r_x2": 286.37, "r_y2": 255.44, "r_x3": 50.11, "r_y3": 255.44, "coord_origin": "TOPLEFT" }, "text": "The design criteria for our model are the following. First,", "orig": "The design criteria for our model are the following. First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.3, "r_x1": 286.37, "r_y1": 276.3, "r_x2": 286.37, "r_y2": 267.4, "r_x3": 50.11, "r_y3": 267.4, "coord_origin": "TOPLEFT" }, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.26, "r_x1": 286.37, "r_y1": 288.26, "r_x2": 286.37, "r_y2": 279.35, "r_x3": 50.11, "r_y3": 279.35, "coord_origin": "TOPLEFT" }, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.21, "r_x1": 88.57, "r_y1": 300.21, "r_x2": 88.57, "r_y2": 291.31, "r_x3": 50.11, "r_y3": 291.31, "coord_origin": "TOPLEFT" }, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 95.5, "r_y0": 300.21, "r_x1": 286.37, "r_y1": 300.21, "r_x2": 286.37, "r_y2": 291.31, "r_x3": 95.5, "r_y3": 291.31, "coord_origin": "TOPLEFT" }, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.17, "r_x1": 286.37, "r_y1": 312.17, "r_x2": 286.37, "r_y2": 303.26, "r_x3": 50.11, "r_y3": 303.26, "coord_origin": "TOPLEFT" }, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.12, "r_x1": 286.37, "r_y1": 324.12, "r_x2": 286.37, "r_y2": 315.22, "r_x3": 50.11, "r_y3": 315.22, "coord_origin": "TOPLEFT" }, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.08, "r_x1": 286.37, "r_y1": 336.08, "r_x2": 286.37, "r_y2": 327.17, "r_x3": 50.11, "r_y3": 327.17, "coord_origin": "TOPLEFT" }, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.03, "r_x1": 286.37, "r_y1": 348.03, "r_x2": 286.37, "r_y2": 339.13, "r_x3": 50.11, "r_y3": 339.13, "coord_origin": "TOPLEFT" }, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.99, "r_x1": 286.37, "r_y1": 359.99, "r_x2": 286.37, "r_y2": 351.08, "r_x3": 50.11, "r_y3": 351.08, "coord_origin": "TOPLEFT" }, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.95, "r_x1": 76.95, "r_y1": 371.95, "r_x2": 76.95, "r_y2": 363.04, "r_x3": 50.11, "r_y3": 363.04, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image." }, { "label": "text", "id": 7, "page_no": 1, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 375.45, "r": 286.37, "b": 432.17, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 384.35, "r_x1": 286.36, "r_y1": 384.35, "r_x2": 286.36, "r_y2": 375.45, "r_x3": 62.07, "r_y3": 375.45, "coord_origin": "TOPLEFT" }, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.31, "r_x1": 120.99, "r_y1": 396.31, "r_x2": 120.99, "r_y2": 387.4, "r_x3": 50.11, "r_y3": 387.4, "coord_origin": "TOPLEFT" }, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 123.9, "r_y0": 396.24, "r_x1": 179.73, "r_y1": 396.24, "r_x2": 179.73, "r_y2": 387.28, "r_x3": 123.9, "r_y3": 387.28, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.65, "r_y0": 396.31, "r_x1": 286.37, "r_y1": 396.31, "r_x2": 286.37, "r_y2": 387.4, "r_x3": 182.65, "r_y3": 387.4, "coord_origin": "TOPLEFT" }, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 408.26, "r_x1": 181.76, "r_y1": 408.26, "r_x2": 181.76, "r_y2": 399.36, "r_x3": 50.11, "r_y3": 399.36, "coord_origin": "TOPLEFT" }, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.1, "r_y0": 408.19, "r_x1": 240.2, "r_y1": 408.19, "r_x2": 240.2, "r_y2": 399.24, "r_x3": 184.1, "r_y3": 399.24, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.2, "r_y0": 408.26, "r_x1": 286.36, "r_y1": 408.26, "r_x2": 286.36, "r_y2": 399.36, "r_x3": 240.2, "r_y3": 399.36, "coord_origin": "TOPLEFT" }, "text": "$^{1}$. In partic-", "orig": "$^{1}$. In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 420.22, "r_x1": 286.37, "r_y1": 420.22, "r_x2": 286.37, "r_y2": 411.31, "r_x3": 50.11, "r_y3": 411.31, "coord_origin": "TOPLEFT" }, "text": "ular, our contributions in this work can be summarised as", "orig": "ular, our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 432.17, "r_x1": 82.52, "r_y1": 432.17, "r_x2": 82.52, "r_y2": 423.27, "r_x3": 50.11, "r_y3": 423.27, "coord_origin": "TOPLEFT" }, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet $^{1}$. In particular, our contributions in this work can be summarised as follows:" }, { "label": "list_item", "id": 6, "page_no": 1, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 61.57, "t": 444.43, "r": 286.36, "b": 489.32, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 453.46, "r_x1": 70.74, "r_y1": 453.46, "r_x2": 70.74, "r_y2": 444.55, "r_x3": 61.57, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.03, "r_y0": 453.46, "r_x1": 117.1, "r_y1": 453.46, "r_x2": 117.1, "r_y2": 444.55, "r_x3": 73.03, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.59, "r_y0": 453.39, "r_x1": 175.42, "r_y1": 453.39, "r_x2": 175.42, "r_y2": 444.43, "r_x3": 119.59, "r_y3": 444.43, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.42, "r_y0": 453.46, "r_x1": 286.36, "r_y1": 453.46, "r_x2": 286.36, "r_y2": 444.55, "r_x3": 175.42, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 465.41, "r_x1": 286.36, "r_y1": 465.41, "r_x2": 286.36, "r_y2": 456.51, "r_x3": 70.04, "r_y3": 456.51, "coord_origin": "TOPLEFT" }, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 477.37, "r_x1": 286.36, "r_y1": 477.37, "r_x2": 286.36, "r_y2": 468.46, "r_x3": 70.04, "r_y3": 468.46, "coord_origin": "TOPLEFT" }, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 489.32, "r_x1": 99.64, "r_y1": 489.32, "r_x2": 99.64, "r_y2": 480.42, "r_x3": 70.04, "r_y3": 480.42, "coord_origin": "TOPLEFT" }, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach." }, { "label": "list_item", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 61.57, "t": 502.03, "r": 286.36, "b": 546.93, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 511.06, "r_x1": 71.62, "r_y1": 511.06, "r_x2": 71.62, "r_y2": 502.15, "r_x3": 61.57, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.13, "r_y0": 511.06, "r_x1": 196.1, "r_y1": 511.06, "r_x2": 196.1, "r_y2": 502.15, "r_x3": 74.13, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "Across all benchmark datasets", "orig": "Across all benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.03, "r_x3": 200.31, "r_y3": 502.03, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.35, "r_y0": 511.06, "r_x1": 286.36, "r_y1": 511.06, "r_x2": 286.36, "r_y2": 502.15, "r_x3": 260.35, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 523.01, "r_x1": 286.36, "r_y1": 523.01, "r_x2": 286.36, "r_y2": 514.11, "r_x3": 70.04, "r_y3": 514.11, "coord_origin": "TOPLEFT" }, "text": "icantly outperforms existing state-of-the-art metrics,", "orig": "icantly outperforms existing state-of-the-art metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 534.97, "r_x1": 286.36, "r_y1": 534.97, "r_x2": 286.36, "r_y2": 526.06, "r_x3": 70.04, "r_y3": 526.06, "coord_origin": "TOPLEFT" }, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 546.93, "r_x1": 161.65, "r_y1": 546.93, "r_x2": 161.65, "r_y2": 538.02, "r_x3": 70.04, "r_y3": 538.02, "coord_origin": "TOPLEFT" }, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works." }, { "label": "list_item", "id": 9, "page_no": 1, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 61.57, "t": 559.64, "r": 286.36, "b": 592.57, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 568.66, "r_x1": 71.12, "r_y1": 568.66, "r_x2": 71.12, "r_y2": 559.76, "r_x3": 61.57, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.5, "r_y0": 568.66, "r_x1": 116.71, "r_y1": 568.66, "r_x2": 116.71, "r_y2": 559.76, "r_x3": 73.5, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 121.58, "r_y0": 568.59, "r_x1": 177.68, "r_y1": 568.59, "r_x2": 177.68, "r_y2": 559.64, "r_x3": 121.58, "r_y3": 559.64, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.55, "r_y0": 568.66, "r_x1": 286.36, "r_y1": 568.66, "r_x2": 286.36, "r_y2": 559.76, "r_x3": 182.55, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "a synthetically generated", "orig": "a synthetically generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 580.62, "r_x1": 286.36, "r_y1": 580.62, "r_x2": 286.36, "r_y2": 571.71, "r_x3": 70.04, "r_y3": 571.71, "coord_origin": "TOPLEFT" }, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 592.57, "r_x1": 82.4, "r_y1": 592.57, "r_x2": 82.4, "r_y2": 583.67, "r_x3": 70.04, "r_y3": 583.67, "coord_origin": "TOPLEFT" }, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity." }, { "label": "list_item", "id": 8, "page_no": 1, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 61.57, "t": 605.4, "r": 286.37, "b": 638.22, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 614.31, "r_x1": 72.33, "r_y1": 614.31, "r_x2": 72.33, "r_y2": 605.4, "r_x3": 61.57, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.02, "r_y0": 614.31, "r_x1": 286.37, "r_y1": 614.31, "r_x2": 286.37, "r_y2": 605.4, "r_x3": 75.02, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "An augmented dataset based on PubTabNet [37],", "orig": "An augmented dataset based on PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 626.26, "r_x1": 286.36, "r_y1": 626.26, "r_x2": 286.36, "r_y2": 617.36, "r_x3": 70.04, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] with generated", "orig": "FinTabNet [36], and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 638.22, "r_x1": 198.06, "r_y1": 638.22, "r_x2": 198.06, "r_y2": 629.31, "r_x3": 70.04, "r_y3": 629.31, "coord_origin": "TOPLEFT" }, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility." }, { "label": "text", "id": 11, "page_no": 1, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 650.6, "r": 286.37, "b": 695.37, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 659.5, "r_x1": 286.36, "r_y1": 659.5, "r_x2": 286.36, "r_y2": 650.6, "r_x3": 62.07, "r_y3": 650.6, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In Sec. 2, we give", "orig": "The paper is structured as follows. In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 671.46, "r_x1": 286.37, "r_y1": 671.46, "r_x2": 286.37, "r_y2": 662.55, "r_x3": 50.11, "r_y3": 662.55, "coord_origin": "TOPLEFT" }, "text": "a brief overview of the current state-of-the-art. In Sec. 3,", "orig": "a brief overview of the current state-of-the-art. In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 683.41, "r_x1": 286.37, "r_y1": 683.41, "r_x2": 286.37, "r_y2": 674.51, "r_x3": 50.11, "r_y3": 674.51, "coord_origin": "TOPLEFT" }, "text": "we describe the datasets on which we train. In Sec. 4, we", "orig": "we describe the datasets on which we train. In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 695.37, "r_x1": 286.37, "r_y1": 695.37, "r_x2": 286.37, "r_y2": 686.46, "r_x3": 50.11, "r_y3": 686.46, "coord_origin": "TOPLEFT" }, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe" }, { "label": "footnote", "id": 14, "page_no": 1, "cluster": { "id": 14, "label": "footnote", "bbox": { "l": 60.97, "t": 705.6, "r": 183.73, "b": 712.72, "coord_origin": "TOPLEFT" }, "confidence": 0.895, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.97, "r_y0": 712.72, "r_x1": 183.73, "r_y1": 712.72, "r_x2": 183.73, "r_y2": 705.6, "r_x3": 60.97, "r_y3": 705.6, "coord_origin": "TOPLEFT" }, "text": "$^{1}$https://github.com/IBM/SynthTabNet", "orig": "$^{1}$https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "$^{1}$https://github.com/IBM/SynthTabNet" }, { "label": "text", "id": 10, "page_no": 1, "cluster": { "id": 10, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.977, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 545.12, "r_y1": 84.11, "r_x2": 545.12, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 508.08, "r_y1": 108.02, "r_x2": 508.08, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "its results & performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community." }, { "label": "section_header", "id": 13, "page_no": 1, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 308.86, "t": 121.73, "r": 498.28, "b": 132.48, "coord_origin": "TOPLEFT" }, "confidence": 0.943, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 132.48, "r_x1": 315.58, "r_y1": 132.48, "r_x2": 315.58, "r_y2": 121.73, "r_x3": 308.86, "r_y3": 121.73, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.54, "r_y0": 132.48, "r_x1": 498.28, "r_y1": 132.48, "r_x2": 498.28, "r_y2": 121.73, "r_x3": 324.54, "r_y3": 121.73, "coord_origin": "TOPLEFT" }, "text": "Previous work and State of the Art", "orig": "Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Previous work and State of the Art" }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 142.22, "r": 545.12, "b": 330.46, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 151.13, "r_x1": 545.11, "r_y1": 151.13, "r_x2": 545.11, "r_y2": 142.22, "r_x3": 320.82, "r_y3": 142.22, "coord_origin": "TOPLEFT" }, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 163.08, "r_x1": 545.12, "r_y1": 163.08, "r_x2": 545.12, "r_y2": 154.18, "r_x3": 308.86, "r_y3": 154.18, "coord_origin": "TOPLEFT" }, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 175.04, "r_x1": 522.56, "r_y1": 175.04, "r_x2": 522.56, "r_y2": 166.13, "r_x3": 308.86, "r_y3": 166.13, "coord_origin": "TOPLEFT" }, "text": "tivates many organised public challenges [6, 4, 14].", "orig": "tivates many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 175.04, "r_x1": 545.12, "r_y1": 175.04, "r_x2": 545.12, "r_y2": 166.13, "r_x3": 529.62, "r_y3": 166.13, "coord_origin": "TOPLEFT" }, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 186.99, "r_x1": 545.12, "r_y1": 186.99, "r_x2": 545.12, "r_y2": 178.09, "r_x3": 308.86, "r_y3": 178.09, "coord_origin": "TOPLEFT" }, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 198.95, "r_x1": 545.12, "r_y1": 198.95, "r_x2": 545.12, "r_y2": 190.04, "r_x3": 308.86, "r_y3": 190.04, "coord_origin": "TOPLEFT" }, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 210.9, "r_x1": 346.98, "r_y1": 210.9, "r_x2": 346.98, "r_y2": 202.0, "r_x3": 308.86, "r_y3": 202.0, "coord_origin": "TOPLEFT" }, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.87, "r_y0": 210.9, "r_x1": 545.12, "r_y1": 210.9, "r_x2": 545.12, "r_y2": 202.0, "r_x3": 354.87, "r_y3": 202.0, "coord_origin": "TOPLEFT" }, "text": "Such large variety requires a flexible method.", "orig": "Such large variety requires a flexible method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 222.86, "r_x1": 545.12, "r_y1": 222.86, "r_x2": 545.12, "r_y2": 213.95, "r_x3": 308.86, "r_y3": 213.95, "coord_origin": "TOPLEFT" }, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 234.81, "r_x1": 530.92, "r_y1": 234.81, "r_x2": 530.92, "r_y2": 225.91, "r_x3": 308.86, "r_y3": 225.91, "coord_origin": "TOPLEFT" }, "text": "ers, which can be extremely intricate and demanding.", "orig": "ers, which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.92, "r_y0": 234.81, "r_x1": 545.12, "r_y1": 234.81, "r_x2": 545.12, "r_y2": 225.91, "r_x3": 537.92, "r_y3": 225.91, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 246.77, "r_x1": 545.12, "r_y1": 246.77, "r_x2": 545.12, "r_y2": 237.86, "r_x3": 308.86, "r_y3": 237.86, "coord_origin": "TOPLEFT" }, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.72, "r_x1": 545.12, "r_y1": 258.72, "r_x2": 545.12, "r_y2": 249.82, "r_x3": 308.86, "r_y3": 249.82, "coord_origin": "TOPLEFT" }, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.68, "r_x1": 439.84, "r_y1": 270.68, "r_x2": 439.84, "r_y2": 261.77, "r_x3": 308.86, "r_y3": 261.77, "coord_origin": "TOPLEFT" }, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.44, "r_y0": 270.46, "r_x1": 452.19, "r_y1": 270.46, "r_x2": 452.19, "r_y2": 261.61, "r_x3": 444.44, "r_y3": 261.61, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.89, "r_y0": 270.46, "r_x1": 470.83, "r_y1": 270.46, "r_x2": 470.83, "r_y2": 261.61, "r_x3": 455.89, "r_y3": 261.61, "coord_origin": "TOPLEFT" }, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 470.83, "r_y0": 270.68, "r_x1": 545.12, "r_y1": 270.68, "r_x2": 545.12, "r_y2": 261.77, "r_x3": 470.83, "r_y3": 261.77, "coord_origin": "TOPLEFT" }, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.63, "r_x1": 545.12, "r_y1": 282.63, "r_x2": 545.12, "r_y2": 273.73, "r_x3": 308.86, "r_y3": 273.73, "coord_origin": "TOPLEFT" }, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.59, "r_x1": 545.12, "r_y1": 294.59, "r_x2": 545.12, "r_y2": 285.68, "r_x3": 308.86, "r_y3": 285.68, "coord_origin": "TOPLEFT" }, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 306.55, "r_x1": 545.12, "r_y1": 306.55, "r_x2": 545.12, "r_y2": 297.64, "r_x3": 308.86, "r_y3": 297.64, "coord_origin": "TOPLEFT" }, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 318.5, "r_x1": 545.12, "r_y1": 318.5, "r_x2": 545.12, "r_y2": 309.59, "r_x3": 308.86, "r_y3": 309.59, "coord_origin": "TOPLEFT" }, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 330.46, "r_x1": 425.92, "r_y1": 330.46, "r_x2": 425.92, "r_y2": 321.55, "r_x3": 308.86, "r_y3": 321.55, "coord_origin": "TOPLEFT" }, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc." }, { "label": "text", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 333.57, "r": 545.12, "b": 450.07, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 342.48, "r_x1": 545.11, "r_y1": 342.48, "r_x2": 545.11, "r_y2": 333.57, "r_x3": 320.82, "r_y3": 333.57, "coord_origin": "TOPLEFT" }, "text": "Before the rising popularity of deep neural networks,", "orig": "Before the rising popularity of deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 354.43, "r_x1": 545.11, "r_y1": 354.43, "r_x2": 545.11, "r_y2": 345.52, "r_x3": 308.86, "r_y3": 345.52, "coord_origin": "TOPLEFT" }, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 366.39, "r_x1": 545.12, "r_y1": 366.39, "r_x2": 545.12, "r_y2": 357.48, "r_x3": 308.86, "r_y3": 357.48, "coord_origin": "TOPLEFT" }, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 378.34, "r_x1": 545.12, "r_y1": 378.34, "r_x2": 545.12, "r_y2": 369.44, "r_x3": 308.86, "r_y3": 369.44, "coord_origin": "TOPLEFT" }, "text": "28]. Although such methods work well on constrained ta-", "orig": "28]. Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 390.3, "r_x1": 545.12, "r_y1": 390.3, "r_x2": 545.12, "r_y2": 381.39, "r_x3": 308.86, "r_y3": 381.39, "coord_origin": "TOPLEFT" }, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 402.25, "r_x1": 545.12, "r_y1": 402.25, "r_x2": 545.12, "r_y2": 393.35, "r_x3": 308.86, "r_y3": 393.35, "coord_origin": "TOPLEFT" }, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 414.21, "r_x1": 545.12, "r_y1": 414.21, "r_x2": 545.12, "r_y2": 405.3, "r_x3": 308.86, "r_y3": 405.3, "coord_origin": "TOPLEFT" }, "text": "the availability of large datasets. To the best-of-our knowl-", "orig": "the availability of large datasets. To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 426.16, "r_x1": 545.12, "r_y1": 426.16, "r_x2": 545.12, "r_y2": 417.26, "r_x3": 308.86, "r_y3": 417.26, "coord_origin": "TOPLEFT" }, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 438.12, "r_x1": 545.12, "r_y1": 438.12, "r_x2": 545.12, "r_y2": 429.21, "r_x3": 308.86, "r_y3": 429.21, "coord_origin": "TOPLEFT" }, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 450.07, "r_x1": 401.29, "r_y1": 450.07, "r_x2": 401.29, "r_y2": 441.17, "r_x3": 308.86, "r_y3": 441.17, "coord_origin": "TOPLEFT" }, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification." }, { "label": "text", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 453.07, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 462.02, "r_x1": 423.26, "r_y1": 462.02, "r_x2": 423.26, "r_y2": 453.07, "r_x3": 320.82, "r_y3": 453.07, "coord_origin": "TOPLEFT" }, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.27, "r_y0": 462.09, "r_x1": 545.11, "r_y1": 462.09, "r_x2": 545.11, "r_y2": 453.19, "r_x3": 423.27, "r_y3": 453.19, "coord_origin": "TOPLEFT" }, "text": ": In this type of network, one", "orig": ": In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 474.05, "r_x1": 545.12, "r_y1": 474.05, "r_x2": 545.12, "r_y2": 465.14, "r_x3": 308.86, "r_y3": 465.14, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence of tokens starting from an encoded", "orig": "predicts a sequence of tokens starting from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 486.0, "r_x1": 335.7, "r_y1": 486.0, "r_x2": 335.7, "r_y2": 477.1, "r_x3": 308.86, "r_y3": 477.1, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.85, "r_y0": 486.0, "r_x1": 545.12, "r_y1": 486.0, "r_x2": 545.12, "r_y2": 477.1, "r_x3": 345.85, "r_y3": 477.1, "coord_origin": "TOPLEFT" }, "text": "Such sequences of tokens can be HTML table", "orig": "Such sequences of tokens can be HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.96, "r_x1": 545.11, "r_y1": 497.96, "r_x2": 545.11, "r_y2": 489.05, "r_x3": 308.86, "r_y3": 489.05, "coord_origin": "TOPLEFT" }, "text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.91, "r_x1": 545.11, "r_y1": 509.91, "r_x2": 545.11, "r_y2": 501.01, "r_x3": 308.86, "r_y3": 501.01, "coord_origin": "TOPLEFT" }, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.87, "r_x1": 545.12, "r_y1": 521.87, "r_x2": 545.12, "r_y2": 512.96, "r_x3": 308.86, "r_y3": 512.96, "coord_origin": "TOPLEFT" }, "text": "formed into the other. There are however subtle variations", "orig": "formed into the other. There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.82, "r_x1": 545.12, "r_y1": 533.82, "r_x2": 545.12, "r_y2": 524.92, "r_x3": 308.86, "r_y3": 524.92, "coord_origin": "TOPLEFT" }, "text": "in the Image-to-Text networks. The easiest network archi-", "orig": "in the Image-to-Text networks. The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.78, "r_x1": 420.94, "r_y1": 545.78, "r_x2": 420.94, "r_y2": 536.87, "r_x3": 308.86, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "tectures are \u201cimage-encoder", "orig": "tectures are \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.59, "r_y0": 545.56, "r_x1": 433.56, "r_y1": 545.56, "r_x2": 433.56, "r_y2": 536.16, "r_x3": 423.59, "r_y3": 536.16, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.21, "r_y0": 545.78, "r_x1": 545.11, "r_y1": 545.78, "r_x2": 545.11, "r_y2": 536.87, "r_x3": 436.21, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "text-decoder\u201d (IETD), sim-", "orig": "text-decoder\u201d (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.73, "r_x1": 545.12, "r_y1": 557.73, "r_x2": 545.12, "r_y2": 548.83, "r_x3": 308.86, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.69, "r_x1": 545.11, "r_y1": 569.69, "r_x2": 545.11, "r_y2": 560.78, "r_x3": 308.86, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.64, "r_x1": 545.11, "r_y1": 581.64, "r_x2": 545.11, "r_y2": 572.74, "r_x3": 308.86, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "the LaTeX/HTML string of the entire table, i.e. the sym-", "orig": "the LaTeX/HTML string of the entire table, i.e. the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.6, "r_x1": 545.12, "r_y1": 593.6, "r_x2": 545.12, "r_y2": 584.69, "r_x3": 308.86, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.56, "r_x1": 497.08, "r_y1": 605.56, "r_x2": 497.08, "r_y2": 596.65, "r_x3": 308.86, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "table. Another approach is the \u201cimage-encoder", "orig": "table. Another approach is the \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.8, "r_y0": 605.34, "r_x1": 509.77, "r_y1": 605.34, "r_x2": 509.77, "r_y2": 595.93, "r_x3": 499.8, "r_y3": 595.93, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.5, "r_y0": 605.56, "r_x1": 545.11, "r_y1": 605.56, "r_x2": 545.11, "r_y2": 596.65, "r_x3": 512.5, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.51, "r_x1": 545.12, "r_y1": 617.51, "r_x2": 545.12, "r_y2": 608.6, "r_x3": 308.86, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "coder\u201d (IEDD) networks. In these type of networks, one has", "orig": "coder\u201d (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.47, "r_x1": 545.12, "r_y1": 629.47, "r_x2": 545.12, "r_y2": 620.56, "r_x3": 308.86, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.42, "r_x1": 364.78, "r_y1": 641.42, "r_x2": 364.78, "r_y2": 632.51, "r_x3": 308.86, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.57, "r_y0": 641.19, "r_x1": 415.61, "r_y1": 641.19, "r_x2": 415.61, "r_y2": 632.6, "r_x3": 367.57, "r_y3": 632.6, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.61, "r_y0": 641.42, "r_x1": 545.12, "r_y1": 641.42, "r_x2": 545.12, "r_y2": 632.51, "r_x3": 415.61, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": ", i.e. it only produces the HTM-", "orig": ", i.e. it only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.38, "r_x1": 545.12, "r_y1": 653.38, "r_x2": 545.12, "r_y2": 644.47, "r_x3": 308.86, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.1, "r_x1": 373.6, "r_y1": 665.1, "r_x2": 373.6, "r_y2": 656.51, "r_x3": 308.86, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.91, "r_y0": 665.33, "r_x1": 545.12, "r_y1": 665.33, "r_x2": 545.12, "r_y2": 656.43, "r_x3": 376.91, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.12, "r_y1": 677.29, "r_x2": 545.12, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.01, "r_x1": 356.9, "r_y1": 689.01, "r_x2": 356.9, "r_y2": 680.42, "r_x3": 308.86, "r_y3": 680.42, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.13, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 357.13, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": ") to generate the textual content of each table", "orig": ") to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "cell. The network architecture of IEDD is certainly more", "orig": "cell. The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are \"image-encoder \u2192 text-decoder\" (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the \"image-encoder \u2192 dual decoder\" (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the" }, { "label": "page_footer", "id": 15, "page_no": 1, "cluster": { "id": 15, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.878, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" } ], "body": [ { "label": "text", "id": 12, "page_no": 1, "cluster": { "id": 12, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 96.07, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 112.65, "r_y1": 96.07, "r_x2": 112.65, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "considered as a solved problem, given enough ground-truth data to train on." }, { "label": "text", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 99.57, "r": 286.37, "b": 228.03, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 108.48, "r_x1": 286.36, "r_y1": 108.48, "r_x2": 286.36, "r_y2": 99.57, "r_x3": 62.07, "r_y3": 99.57, "coord_origin": "TOPLEFT" }, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 120.43, "r_x1": 74.75, "r_y1": 120.43, "r_x2": 74.75, "r_y2": 111.53, "r_x3": 50.11, "r_y3": 111.53, "coord_origin": "TOPLEFT" }, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.33, "r_y0": 120.43, "r_x1": 286.37, "r_y1": 120.43, "r_x2": 286.37, "r_y2": 111.53, "r_x3": 81.33, "r_y3": 111.53, "coord_origin": "TOPLEFT" }, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 132.39, "r_x1": 286.37, "r_y1": 132.39, "r_x2": 286.37, "r_y2": 123.48, "r_x3": 50.11, "r_y3": 123.48, "coord_origin": "TOPLEFT" }, "text": "munity of document understanding [6, 4, 14]. Contrary to", "orig": "munity of document understanding [6, 4, 14]. Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 144.34, "r_x1": 286.37, "r_y1": 144.34, "r_x2": 286.37, "r_y2": 135.44, "r_x3": 50.11, "r_y3": 135.44, "coord_origin": "TOPLEFT" }, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 156.3, "r_x1": 286.37, "r_y1": 156.3, "r_x2": 286.37, "r_y2": 147.39, "r_x3": 50.11, "r_y3": 147.39, "coord_origin": "TOPLEFT" }, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 168.25, "r_x1": 286.37, "r_y1": 168.25, "r_x2": 286.37, "r_y2": 159.35, "r_x3": 50.11, "r_y3": 159.35, "coord_origin": "TOPLEFT" }, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 180.21, "r_x1": 286.37, "r_y1": 180.21, "r_x2": 286.37, "r_y2": 171.3, "r_x3": 50.11, "r_y3": 171.3, "coord_origin": "TOPLEFT" }, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 192.16, "r_x1": 286.37, "r_y1": 192.16, "r_x2": 286.37, "r_y2": 183.26, "r_x3": 50.11, "r_y3": 183.26, "coord_origin": "TOPLEFT" }, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 204.12, "r_x1": 286.37, "r_y1": 204.12, "r_x2": 286.37, "r_y2": 195.21, "r_x3": 50.11, "r_y3": 195.21, "coord_origin": "TOPLEFT" }, "text": "nesses (see Sec. 2). The common denominator here is the", "orig": "nesses (see Sec. 2). The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 216.07, "r_x1": 286.37, "r_y1": 216.07, "r_x2": 286.37, "r_y2": 207.17, "r_x3": 50.11, "r_y3": 207.17, "coord_origin": "TOPLEFT" }, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 228.03, "r_x1": 278.66, "r_y1": 228.03, "r_x2": 278.66, "r_y2": 219.12, "r_x3": 50.11, "r_y3": 219.12, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image." }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 231.53, "r": 286.37, "b": 371.95, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 240.44, "r_x1": 286.36, "r_y1": 240.44, "r_x2": 286.36, "r_y2": 231.53, "r_x3": 62.07, "r_y3": 231.53, "coord_origin": "TOPLEFT" }, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 252.39, "r_x1": 286.37, "r_y1": 252.39, "r_x2": 286.37, "r_y2": 243.49, "r_x3": 50.11, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "present a robust table-structure decomposition algorithm.", "orig": "present a robust table-structure decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.35, "r_x1": 286.37, "r_y1": 264.35, "r_x2": 286.37, "r_y2": 255.44, "r_x3": 50.11, "r_y3": 255.44, "coord_origin": "TOPLEFT" }, "text": "The design criteria for our model are the following. First,", "orig": "The design criteria for our model are the following. First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.3, "r_x1": 286.37, "r_y1": 276.3, "r_x2": 286.37, "r_y2": 267.4, "r_x3": 50.11, "r_y3": 267.4, "coord_origin": "TOPLEFT" }, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.26, "r_x1": 286.37, "r_y1": 288.26, "r_x2": 286.37, "r_y2": 279.35, "r_x3": 50.11, "r_y3": 279.35, "coord_origin": "TOPLEFT" }, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.21, "r_x1": 88.57, "r_y1": 300.21, "r_x2": 88.57, "r_y2": 291.31, "r_x3": 50.11, "r_y3": 291.31, "coord_origin": "TOPLEFT" }, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 95.5, "r_y0": 300.21, "r_x1": 286.37, "r_y1": 300.21, "r_x2": 286.37, "r_y2": 291.31, "r_x3": 95.5, "r_y3": 291.31, "coord_origin": "TOPLEFT" }, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.17, "r_x1": 286.37, "r_y1": 312.17, "r_x2": 286.37, "r_y2": 303.26, "r_x3": 50.11, "r_y3": 303.26, "coord_origin": "TOPLEFT" }, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.12, "r_x1": 286.37, "r_y1": 324.12, "r_x2": 286.37, "r_y2": 315.22, "r_x3": 50.11, "r_y3": 315.22, "coord_origin": "TOPLEFT" }, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.08, "r_x1": 286.37, "r_y1": 336.08, "r_x2": 286.37, "r_y2": 327.17, "r_x3": 50.11, "r_y3": 327.17, "coord_origin": "TOPLEFT" }, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.03, "r_x1": 286.37, "r_y1": 348.03, "r_x2": 286.37, "r_y2": 339.13, "r_x3": 50.11, "r_y3": 339.13, "coord_origin": "TOPLEFT" }, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.99, "r_x1": 286.37, "r_y1": 359.99, "r_x2": 286.37, "r_y2": 351.08, "r_x3": 50.11, "r_y3": 351.08, "coord_origin": "TOPLEFT" }, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.95, "r_x1": 76.95, "r_y1": 371.95, "r_x2": 76.95, "r_y2": 363.04, "r_x3": 50.11, "r_y3": 363.04, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image." }, { "label": "text", "id": 7, "page_no": 1, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 375.45, "r": 286.37, "b": 432.17, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 384.35, "r_x1": 286.36, "r_y1": 384.35, "r_x2": 286.36, "r_y2": 375.45, "r_x3": 62.07, "r_y3": 375.45, "coord_origin": "TOPLEFT" }, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.31, "r_x1": 120.99, "r_y1": 396.31, "r_x2": 120.99, "r_y2": 387.4, "r_x3": 50.11, "r_y3": 387.4, "coord_origin": "TOPLEFT" }, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 123.9, "r_y0": 396.24, "r_x1": 179.73, "r_y1": 396.24, "r_x2": 179.73, "r_y2": 387.28, "r_x3": 123.9, "r_y3": 387.28, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.65, "r_y0": 396.31, "r_x1": 286.37, "r_y1": 396.31, "r_x2": 286.37, "r_y2": 387.4, "r_x3": 182.65, "r_y3": 387.4, "coord_origin": "TOPLEFT" }, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 408.26, "r_x1": 181.76, "r_y1": 408.26, "r_x2": 181.76, "r_y2": 399.36, "r_x3": 50.11, "r_y3": 399.36, "coord_origin": "TOPLEFT" }, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.1, "r_y0": 408.19, "r_x1": 240.2, "r_y1": 408.19, "r_x2": 240.2, "r_y2": 399.24, "r_x3": 184.1, "r_y3": 399.24, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.2, "r_y0": 408.26, "r_x1": 286.36, "r_y1": 408.26, "r_x2": 286.36, "r_y2": 399.36, "r_x3": 240.2, "r_y3": 399.36, "coord_origin": "TOPLEFT" }, "text": "$^{1}$. In partic-", "orig": "$^{1}$. In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 420.22, "r_x1": 286.37, "r_y1": 420.22, "r_x2": 286.37, "r_y2": 411.31, "r_x3": 50.11, "r_y3": 411.31, "coord_origin": "TOPLEFT" }, "text": "ular, our contributions in this work can be summarised as", "orig": "ular, our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 432.17, "r_x1": 82.52, "r_y1": 432.17, "r_x2": 82.52, "r_y2": 423.27, "r_x3": 50.11, "r_y3": 423.27, "coord_origin": "TOPLEFT" }, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet $^{1}$. In particular, our contributions in this work can be summarised as follows:" }, { "label": "list_item", "id": 6, "page_no": 1, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 61.57, "t": 444.43, "r": 286.36, "b": 489.32, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 453.46, "r_x1": 70.74, "r_y1": 453.46, "r_x2": 70.74, "r_y2": 444.55, "r_x3": 61.57, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.03, "r_y0": 453.46, "r_x1": 117.1, "r_y1": 453.46, "r_x2": 117.1, "r_y2": 444.55, "r_x3": 73.03, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.59, "r_y0": 453.39, "r_x1": 175.42, "r_y1": 453.39, "r_x2": 175.42, "r_y2": 444.43, "r_x3": 119.59, "r_y3": 444.43, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.42, "r_y0": 453.46, "r_x1": 286.36, "r_y1": 453.46, "r_x2": 286.36, "r_y2": 444.55, "r_x3": 175.42, "r_y3": 444.55, "coord_origin": "TOPLEFT" }, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 465.41, "r_x1": 286.36, "r_y1": 465.41, "r_x2": 286.36, "r_y2": 456.51, "r_x3": 70.04, "r_y3": 456.51, "coord_origin": "TOPLEFT" }, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 477.37, "r_x1": 286.36, "r_y1": 477.37, "r_x2": 286.36, "r_y2": 468.46, "r_x3": 70.04, "r_y3": 468.46, "coord_origin": "TOPLEFT" }, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 489.32, "r_x1": 99.64, "r_y1": 489.32, "r_x2": 99.64, "r_y2": 480.42, "r_x3": 70.04, "r_y3": 480.42, "coord_origin": "TOPLEFT" }, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach." }, { "label": "list_item", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 61.57, "t": 502.03, "r": 286.36, "b": 546.93, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 511.06, "r_x1": 71.62, "r_y1": 511.06, "r_x2": 71.62, "r_y2": 502.15, "r_x3": 61.57, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.13, "r_y0": 511.06, "r_x1": 196.1, "r_y1": 511.06, "r_x2": 196.1, "r_y2": 502.15, "r_x3": 74.13, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "Across all benchmark datasets", "orig": "Across all benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.03, "r_x3": 200.31, "r_y3": 502.03, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.35, "r_y0": 511.06, "r_x1": 286.36, "r_y1": 511.06, "r_x2": 286.36, "r_y2": 502.15, "r_x3": 260.35, "r_y3": 502.15, "coord_origin": "TOPLEFT" }, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 523.01, "r_x1": 286.36, "r_y1": 523.01, "r_x2": 286.36, "r_y2": 514.11, "r_x3": 70.04, "r_y3": 514.11, "coord_origin": "TOPLEFT" }, "text": "icantly outperforms existing state-of-the-art metrics,", "orig": "icantly outperforms existing state-of-the-art metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 534.97, "r_x1": 286.36, "r_y1": 534.97, "r_x2": 286.36, "r_y2": 526.06, "r_x3": 70.04, "r_y3": 526.06, "coord_origin": "TOPLEFT" }, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 546.93, "r_x1": 161.65, "r_y1": 546.93, "r_x2": 161.65, "r_y2": 538.02, "r_x3": 70.04, "r_y3": 538.02, "coord_origin": "TOPLEFT" }, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works." }, { "label": "list_item", "id": 9, "page_no": 1, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 61.57, "t": 559.64, "r": 286.36, "b": 592.57, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 568.66, "r_x1": 71.12, "r_y1": 568.66, "r_x2": 71.12, "r_y2": 559.76, "r_x3": 61.57, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.5, "r_y0": 568.66, "r_x1": 116.71, "r_y1": 568.66, "r_x2": 116.71, "r_y2": 559.76, "r_x3": 73.5, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 121.58, "r_y0": 568.59, "r_x1": 177.68, "r_y1": 568.59, "r_x2": 177.68, "r_y2": 559.64, "r_x3": 121.58, "r_y3": 559.64, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.55, "r_y0": 568.66, "r_x1": 286.36, "r_y1": 568.66, "r_x2": 286.36, "r_y2": 559.76, "r_x3": 182.55, "r_y3": 559.76, "coord_origin": "TOPLEFT" }, "text": "a synthetically generated", "orig": "a synthetically generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 580.62, "r_x1": 286.36, "r_y1": 580.62, "r_x2": 286.36, "r_y2": 571.71, "r_x3": 70.04, "r_y3": 571.71, "coord_origin": "TOPLEFT" }, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 592.57, "r_x1": 82.4, "r_y1": 592.57, "r_x2": 82.4, "r_y2": 583.67, "r_x3": 70.04, "r_y3": 583.67, "coord_origin": "TOPLEFT" }, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity." }, { "label": "list_item", "id": 8, "page_no": 1, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 61.57, "t": 605.4, "r": 286.37, "b": 638.22, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 614.31, "r_x1": 72.33, "r_y1": 614.31, "r_x2": 72.33, "r_y2": 605.4, "r_x3": 61.57, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.02, "r_y0": 614.31, "r_x1": 286.37, "r_y1": 614.31, "r_x2": 286.37, "r_y2": 605.4, "r_x3": 75.02, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "An augmented dataset based on PubTabNet [37],", "orig": "An augmented dataset based on PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 626.26, "r_x1": 286.36, "r_y1": 626.26, "r_x2": 286.36, "r_y2": 617.36, "r_x3": 70.04, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] with generated", "orig": "FinTabNet [36], and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 638.22, "r_x1": 198.06, "r_y1": 638.22, "r_x2": 198.06, "r_y2": 629.31, "r_x3": 70.04, "r_y3": 629.31, "coord_origin": "TOPLEFT" }, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility." }, { "label": "text", "id": 11, "page_no": 1, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 650.6, "r": 286.37, "b": 695.37, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 659.5, "r_x1": 286.36, "r_y1": 659.5, "r_x2": 286.36, "r_y2": 650.6, "r_x3": 62.07, "r_y3": 650.6, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In Sec. 2, we give", "orig": "The paper is structured as follows. In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 671.46, "r_x1": 286.37, "r_y1": 671.46, "r_x2": 286.37, "r_y2": 662.55, "r_x3": 50.11, "r_y3": 662.55, "coord_origin": "TOPLEFT" }, "text": "a brief overview of the current state-of-the-art. In Sec. 3,", "orig": "a brief overview of the current state-of-the-art. In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 683.41, "r_x1": 286.37, "r_y1": 683.41, "r_x2": 286.37, "r_y2": 674.51, "r_x3": 50.11, "r_y3": 674.51, "coord_origin": "TOPLEFT" }, "text": "we describe the datasets on which we train. In Sec. 4, we", "orig": "we describe the datasets on which we train. In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 695.37, "r_x1": 286.37, "r_y1": 695.37, "r_x2": 286.37, "r_y2": 686.46, "r_x3": 50.11, "r_y3": 686.46, "coord_origin": "TOPLEFT" }, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe" }, { "label": "footnote", "id": 14, "page_no": 1, "cluster": { "id": 14, "label": "footnote", "bbox": { "l": 60.97, "t": 705.6, "r": 183.73, "b": 712.72, "coord_origin": "TOPLEFT" }, "confidence": 0.895, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.97, "r_y0": 712.72, "r_x1": 183.73, "r_y1": 712.72, "r_x2": 183.73, "r_y2": 705.6, "r_x3": 60.97, "r_y3": 705.6, "coord_origin": "TOPLEFT" }, "text": "$^{1}$https://github.com/IBM/SynthTabNet", "orig": "$^{1}$https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "$^{1}$https://github.com/IBM/SynthTabNet" }, { "label": "text", "id": 10, "page_no": 1, "cluster": { "id": 10, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.977, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 545.12, "r_y1": 84.11, "r_x2": 545.12, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "its results & performance in Sec. 5. As a conclusion, we de-", "orig": "its results & performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 508.08, "r_y1": 108.02, "r_x2": 508.08, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "its results & performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community." }, { "label": "section_header", "id": 13, "page_no": 1, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 308.86, "t": 121.73, "r": 498.28, "b": 132.48, "coord_origin": "TOPLEFT" }, "confidence": 0.943, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 132.48, "r_x1": 315.58, "r_y1": 132.48, "r_x2": 315.58, "r_y2": 121.73, "r_x3": 308.86, "r_y3": 121.73, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.54, "r_y0": 132.48, "r_x1": 498.28, "r_y1": 132.48, "r_x2": 498.28, "r_y2": 121.73, "r_x3": 324.54, "r_y3": 121.73, "coord_origin": "TOPLEFT" }, "text": "Previous work and State of the Art", "orig": "Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Previous work and State of the Art" }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 142.22, "r": 545.12, "b": 330.46, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 151.13, "r_x1": 545.11, "r_y1": 151.13, "r_x2": 545.11, "r_y2": 142.22, "r_x3": 320.82, "r_y3": 142.22, "coord_origin": "TOPLEFT" }, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 163.08, "r_x1": 545.12, "r_y1": 163.08, "r_x2": 545.12, "r_y2": 154.18, "r_x3": 308.86, "r_y3": 154.18, "coord_origin": "TOPLEFT" }, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 175.04, "r_x1": 522.56, "r_y1": 175.04, "r_x2": 522.56, "r_y2": 166.13, "r_x3": 308.86, "r_y3": 166.13, "coord_origin": "TOPLEFT" }, "text": "tivates many organised public challenges [6, 4, 14].", "orig": "tivates many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 175.04, "r_x1": 545.12, "r_y1": 175.04, "r_x2": 545.12, "r_y2": 166.13, "r_x3": 529.62, "r_y3": 166.13, "coord_origin": "TOPLEFT" }, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 186.99, "r_x1": 545.12, "r_y1": 186.99, "r_x2": 545.12, "r_y2": 178.09, "r_x3": 308.86, "r_y3": 178.09, "coord_origin": "TOPLEFT" }, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 198.95, "r_x1": 545.12, "r_y1": 198.95, "r_x2": 545.12, "r_y2": 190.04, "r_x3": 308.86, "r_y3": 190.04, "coord_origin": "TOPLEFT" }, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 210.9, "r_x1": 346.98, "r_y1": 210.9, "r_x2": 346.98, "r_y2": 202.0, "r_x3": 308.86, "r_y3": 202.0, "coord_origin": "TOPLEFT" }, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.87, "r_y0": 210.9, "r_x1": 545.12, "r_y1": 210.9, "r_x2": 545.12, "r_y2": 202.0, "r_x3": 354.87, "r_y3": 202.0, "coord_origin": "TOPLEFT" }, "text": "Such large variety requires a flexible method.", "orig": "Such large variety requires a flexible method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 222.86, "r_x1": 545.12, "r_y1": 222.86, "r_x2": 545.12, "r_y2": 213.95, "r_x3": 308.86, "r_y3": 213.95, "coord_origin": "TOPLEFT" }, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 234.81, "r_x1": 530.92, "r_y1": 234.81, "r_x2": 530.92, "r_y2": 225.91, "r_x3": 308.86, "r_y3": 225.91, "coord_origin": "TOPLEFT" }, "text": "ers, which can be extremely intricate and demanding.", "orig": "ers, which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.92, "r_y0": 234.81, "r_x1": 545.12, "r_y1": 234.81, "r_x2": 545.12, "r_y2": 225.91, "r_x3": 537.92, "r_y3": 225.91, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 246.77, "r_x1": 545.12, "r_y1": 246.77, "r_x2": 545.12, "r_y2": 237.86, "r_x3": 308.86, "r_y3": 237.86, "coord_origin": "TOPLEFT" }, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.72, "r_x1": 545.12, "r_y1": 258.72, "r_x2": 545.12, "r_y2": 249.82, "r_x3": 308.86, "r_y3": 249.82, "coord_origin": "TOPLEFT" }, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.68, "r_x1": 439.84, "r_y1": 270.68, "r_x2": 439.84, "r_y2": 261.77, "r_x3": 308.86, "r_y3": 261.77, "coord_origin": "TOPLEFT" }, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.44, "r_y0": 270.46, "r_x1": 452.19, "r_y1": 270.46, "r_x2": 452.19, "r_y2": 261.61, "r_x3": 444.44, "r_y3": 261.61, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.89, "r_y0": 270.46, "r_x1": 470.83, "r_y1": 270.46, "r_x2": 470.83, "r_y2": 261.61, "r_x3": 455.89, "r_y3": 261.61, "coord_origin": "TOPLEFT" }, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 470.83, "r_y0": 270.68, "r_x1": 545.12, "r_y1": 270.68, "r_x2": 545.12, "r_y2": 261.77, "r_x3": 470.83, "r_y3": 261.77, "coord_origin": "TOPLEFT" }, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.63, "r_x1": 545.12, "r_y1": 282.63, "r_x2": 545.12, "r_y2": 273.73, "r_x3": 308.86, "r_y3": 273.73, "coord_origin": "TOPLEFT" }, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.59, "r_x1": 545.12, "r_y1": 294.59, "r_x2": 545.12, "r_y2": 285.68, "r_x3": 308.86, "r_y3": 285.68, "coord_origin": "TOPLEFT" }, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 306.55, "r_x1": 545.12, "r_y1": 306.55, "r_x2": 545.12, "r_y2": 297.64, "r_x3": 308.86, "r_y3": 297.64, "coord_origin": "TOPLEFT" }, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 318.5, "r_x1": 545.12, "r_y1": 318.5, "r_x2": 545.12, "r_y2": 309.59, "r_x3": 308.86, "r_y3": 309.59, "coord_origin": "TOPLEFT" }, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 330.46, "r_x1": 425.92, "r_y1": 330.46, "r_x2": 425.92, "r_y2": 321.55, "r_x3": 308.86, "r_y3": 321.55, "coord_origin": "TOPLEFT" }, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc." }, { "label": "text", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 333.57, "r": 545.12, "b": 450.07, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 342.48, "r_x1": 545.11, "r_y1": 342.48, "r_x2": 545.11, "r_y2": 333.57, "r_x3": 320.82, "r_y3": 333.57, "coord_origin": "TOPLEFT" }, "text": "Before the rising popularity of deep neural networks,", "orig": "Before the rising popularity of deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 354.43, "r_x1": 545.11, "r_y1": 354.43, "r_x2": 545.11, "r_y2": 345.52, "r_x3": 308.86, "r_y3": 345.52, "coord_origin": "TOPLEFT" }, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 366.39, "r_x1": 545.12, "r_y1": 366.39, "r_x2": 545.12, "r_y2": 357.48, "r_x3": 308.86, "r_y3": 357.48, "coord_origin": "TOPLEFT" }, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 378.34, "r_x1": 545.12, "r_y1": 378.34, "r_x2": 545.12, "r_y2": 369.44, "r_x3": 308.86, "r_y3": 369.44, "coord_origin": "TOPLEFT" }, "text": "28]. Although such methods work well on constrained ta-", "orig": "28]. Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 390.3, "r_x1": 545.12, "r_y1": 390.3, "r_x2": 545.12, "r_y2": 381.39, "r_x3": 308.86, "r_y3": 381.39, "coord_origin": "TOPLEFT" }, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 402.25, "r_x1": 545.12, "r_y1": 402.25, "r_x2": 545.12, "r_y2": 393.35, "r_x3": 308.86, "r_y3": 393.35, "coord_origin": "TOPLEFT" }, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 414.21, "r_x1": 545.12, "r_y1": 414.21, "r_x2": 545.12, "r_y2": 405.3, "r_x3": 308.86, "r_y3": 405.3, "coord_origin": "TOPLEFT" }, "text": "the availability of large datasets. To the best-of-our knowl-", "orig": "the availability of large datasets. To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 426.16, "r_x1": 545.12, "r_y1": 426.16, "r_x2": 545.12, "r_y2": 417.26, "r_x3": 308.86, "r_y3": 417.26, "coord_origin": "TOPLEFT" }, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 438.12, "r_x1": 545.12, "r_y1": 438.12, "r_x2": 545.12, "r_y2": 429.21, "r_x3": 308.86, "r_y3": 429.21, "coord_origin": "TOPLEFT" }, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 450.07, "r_x1": 401.29, "r_y1": 450.07, "r_x2": 401.29, "r_y2": 441.17, "r_x3": 308.86, "r_y3": 441.17, "coord_origin": "TOPLEFT" }, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification." }, { "label": "text", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 453.07, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 462.02, "r_x1": 423.26, "r_y1": 462.02, "r_x2": 423.26, "r_y2": 453.07, "r_x3": 320.82, "r_y3": 453.07, "coord_origin": "TOPLEFT" }, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.27, "r_y0": 462.09, "r_x1": 545.11, "r_y1": 462.09, "r_x2": 545.11, "r_y2": 453.19, "r_x3": 423.27, "r_y3": 453.19, "coord_origin": "TOPLEFT" }, "text": ": In this type of network, one", "orig": ": In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 474.05, "r_x1": 545.12, "r_y1": 474.05, "r_x2": 545.12, "r_y2": 465.14, "r_x3": 308.86, "r_y3": 465.14, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence of tokens starting from an encoded", "orig": "predicts a sequence of tokens starting from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 486.0, "r_x1": 335.7, "r_y1": 486.0, "r_x2": 335.7, "r_y2": 477.1, "r_x3": 308.86, "r_y3": 477.1, "coord_origin": "TOPLEFT" }, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.85, "r_y0": 486.0, "r_x1": 545.12, "r_y1": 486.0, "r_x2": 545.12, "r_y2": 477.1, "r_x3": 345.85, "r_y3": 477.1, "coord_origin": "TOPLEFT" }, "text": "Such sequences of tokens can be HTML table", "orig": "Such sequences of tokens can be HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.96, "r_x1": 545.11, "r_y1": 497.96, "r_x2": 545.11, "r_y2": 489.05, "r_x3": 308.86, "r_y3": 489.05, "coord_origin": "TOPLEFT" }, "text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.91, "r_x1": 545.11, "r_y1": 509.91, "r_x2": 545.11, "r_y2": 501.01, "r_x3": 308.86, "r_y3": 501.01, "coord_origin": "TOPLEFT" }, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.87, "r_x1": 545.12, "r_y1": 521.87, "r_x2": 545.12, "r_y2": 512.96, "r_x3": 308.86, "r_y3": 512.96, "coord_origin": "TOPLEFT" }, "text": "formed into the other. There are however subtle variations", "orig": "formed into the other. There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.82, "r_x1": 545.12, "r_y1": 533.82, "r_x2": 545.12, "r_y2": 524.92, "r_x3": 308.86, "r_y3": 524.92, "coord_origin": "TOPLEFT" }, "text": "in the Image-to-Text networks. The easiest network archi-", "orig": "in the Image-to-Text networks. The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.78, "r_x1": 420.94, "r_y1": 545.78, "r_x2": 420.94, "r_y2": 536.87, "r_x3": 308.86, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "tectures are \u201cimage-encoder", "orig": "tectures are \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.59, "r_y0": 545.56, "r_x1": 433.56, "r_y1": 545.56, "r_x2": 433.56, "r_y2": 536.16, "r_x3": 423.59, "r_y3": 536.16, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.21, "r_y0": 545.78, "r_x1": 545.11, "r_y1": 545.78, "r_x2": 545.11, "r_y2": 536.87, "r_x3": 436.21, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "text-decoder\u201d (IETD), sim-", "orig": "text-decoder\u201d (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.73, "r_x1": 545.12, "r_y1": 557.73, "r_x2": 545.12, "r_y2": 548.83, "r_x3": 308.86, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.69, "r_x1": 545.11, "r_y1": 569.69, "r_x2": 545.11, "r_y2": 560.78, "r_x3": 308.86, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.64, "r_x1": 545.11, "r_y1": 581.64, "r_x2": 545.11, "r_y2": 572.74, "r_x3": 308.86, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "the LaTeX/HTML string of the entire table, i.e. the sym-", "orig": "the LaTeX/HTML string of the entire table, i.e. the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.6, "r_x1": 545.12, "r_y1": 593.6, "r_x2": 545.12, "r_y2": 584.69, "r_x3": 308.86, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.56, "r_x1": 497.08, "r_y1": 605.56, "r_x2": 497.08, "r_y2": 596.65, "r_x3": 308.86, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "table. Another approach is the \u201cimage-encoder", "orig": "table. Another approach is the \u201cimage-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.8, "r_y0": 605.34, "r_x1": 509.77, "r_y1": 605.34, "r_x2": 509.77, "r_y2": 595.93, "r_x3": 499.8, "r_y3": 595.93, "coord_origin": "TOPLEFT" }, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.5, "r_y0": 605.56, "r_x1": 545.11, "r_y1": 605.56, "r_x2": 545.11, "r_y2": 596.65, "r_x3": 512.5, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.51, "r_x1": 545.12, "r_y1": 617.51, "r_x2": 545.12, "r_y2": 608.6, "r_x3": 308.86, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "coder\u201d (IEDD) networks. In these type of networks, one has", "orig": "coder\u201d (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.47, "r_x1": 545.12, "r_y1": 629.47, "r_x2": 545.12, "r_y2": 620.56, "r_x3": 308.86, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.42, "r_x1": 364.78, "r_y1": 641.42, "r_x2": 364.78, "r_y2": 632.51, "r_x3": 308.86, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.57, "r_y0": 641.19, "r_x1": 415.61, "r_y1": 641.19, "r_x2": 415.61, "r_y2": 632.6, "r_x3": 367.57, "r_y3": 632.6, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.61, "r_y0": 641.42, "r_x1": 545.12, "r_y1": 641.42, "r_x2": 545.12, "r_y2": 632.51, "r_x3": 415.61, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": ", i.e. it only produces the HTM-", "orig": ", i.e. it only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.38, "r_x1": 545.12, "r_y1": 653.38, "r_x2": 545.12, "r_y2": 644.47, "r_x3": 308.86, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.1, "r_x1": 373.6, "r_y1": 665.1, "r_x2": 373.6, "r_y2": 656.51, "r_x3": 308.86, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.91, "r_y0": 665.33, "r_x1": 545.12, "r_y1": 665.33, "r_x2": 545.12, "r_y2": 656.43, "r_x3": 376.91, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.12, "r_y1": 677.29, "r_x2": 545.12, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.01, "r_x1": 356.9, "r_y1": 689.01, "r_x2": 356.9, "r_y2": 680.42, "r_x3": 308.86, "r_y3": 680.42, "coord_origin": "TOPLEFT" }, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.13, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 357.13, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": ") to generate the textual content of each table", "orig": ") to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "cell. The network architecture of IEDD is certainly more", "orig": "cell. The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are \"image-encoder \u2192 text-decoder\" (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the \"image-encoder \u2192 dual decoder\" (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the" } ], "headers": [ { "label": "page_footer", "id": 15, "page_no": 1, "cluster": { "id": 15, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.878, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" } ] } }, { "page_no": 2, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 250.15, "r_y1": 84.11, "r_x2": 250.15, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 96.13, "r_x1": 70.37, "r_y1": 96.13, "r_x2": 70.37, "r_y2": 87.22, "r_x3": 62.07, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.93, "r_y0": 96.13, "r_x1": 110.95, "r_y1": 96.13, "r_x2": 110.95, "r_y2": 87.22, "r_x3": 76.93, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.54, "r_y0": 96.13, "r_x1": 136.26, "r_y1": 96.13, "r_x2": 136.26, "r_y2": 87.22, "r_x3": 118.54, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.82, "r_y0": 96.13, "r_x1": 175.37, "r_y1": 96.13, "r_x2": 175.37, "r_y2": 87.22, "r_x3": 142.82, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.95, "r_y0": 96.13, "r_x1": 232.84, "r_y1": 96.13, "r_x2": 232.84, "r_y2": 87.22, "r_x3": 181.95, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.41, "r_y0": 96.13, "r_x1": 265.41, "r_y1": 96.13, "r_x2": 265.41, "r_y2": 87.22, "r_x3": 239.41, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.98, "r_y0": 96.13, "r_x1": 286.36, "r_y1": 96.13, "r_x2": 286.36, "r_y2": 87.22, "r_x3": 271.98, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.08, "r_x1": 286.37, "r_y1": 108.08, "r_x2": 286.37, "r_y2": 99.17, "r_x3": 50.11, "r_y3": 99.17, "coord_origin": "TOPLEFT" }, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 120.04, "r_x1": 286.37, "r_y1": 120.04, "r_x2": 286.37, "r_y2": 111.13, "r_x3": 50.11, "r_y3": 111.13, "coord_origin": "TOPLEFT" }, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.99, "r_x1": 286.37, "r_y1": 131.99, "r_x2": 286.37, "r_y2": 123.09, "r_x3": 50.11, "r_y3": 123.09, "coord_origin": "TOPLEFT" }, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 143.95, "r_x1": 286.37, "r_y1": 143.95, "r_x2": 286.37, "r_y2": 135.04, "r_x3": 50.11, "r_y3": 135.04, "coord_origin": "TOPLEFT" }, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 155.9, "r_x1": 286.37, "r_y1": 155.9, "r_x2": 286.37, "r_y2": 147.0, "r_x3": 50.11, "r_y3": 147.0, "coord_origin": "TOPLEFT" }, "text": "bedded in the content-decoder. This reliance on a custom,", "orig": "bedded in the content-decoder. This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 167.86, "r_x1": 286.37, "r_y1": 167.86, "r_x2": 286.37, "r_y2": 158.95, "r_x3": 50.11, "r_y3": 158.95, "coord_origin": "TOPLEFT" }, "text": "implicit OCR decoder is of course problematic. OCR is a", "orig": "implicit OCR decoder is of course problematic. OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 179.81, "r_x1": 286.37, "r_y1": 179.81, "r_x2": 286.37, "r_y2": 170.91, "r_x3": 50.11, "r_y3": 170.91, "coord_origin": "TOPLEFT" }, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 191.77, "r_x1": 286.37, "r_y1": 191.77, "r_x2": 286.37, "r_y2": 182.86, "r_x3": 50.11, "r_y3": 182.86, "coord_origin": "TOPLEFT" }, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 203.72, "r_x1": 286.37, "r_y1": 203.72, "r_x2": 286.37, "r_y2": 194.82, "r_x3": 50.11, "r_y3": 194.82, "coord_origin": "TOPLEFT" }, "text": "limited availability for non-english content in the current", "orig": "limited availability for non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 215.68, "r_x1": 286.37, "r_y1": 215.68, "r_x2": 286.37, "r_y2": 206.77, "r_x3": 50.11, "r_y3": 206.77, "coord_origin": "TOPLEFT" }, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 227.63, "r_x1": 286.37, "r_y1": 227.63, "r_x2": 286.37, "r_y2": 218.73, "r_x3": 50.11, "r_y3": 218.73, "coord_origin": "TOPLEFT" }, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 239.59, "r_x1": 286.37, "r_y1": 239.59, "r_x2": 286.37, "r_y2": 230.68, "r_x3": 50.11, "r_y3": 230.68, "coord_origin": "TOPLEFT" }, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 251.54, "r_x1": 286.37, "r_y1": 251.54, "r_x2": 286.37, "r_y2": 242.64, "r_x3": 50.11, "r_y3": 242.64, "coord_origin": "TOPLEFT" }, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 263.5, "r_x1": 286.37, "r_y1": 263.5, "r_x2": 286.37, "r_y2": 254.59, "r_x3": 50.11, "r_y3": 254.59, "coord_origin": "TOPLEFT" }, "text": "cell. The latter was the inspiration for the work of this pa-", "orig": "cell. The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 275.45, "r_x1": 64.78, "r_y1": 275.45, "r_x2": 64.78, "r_y2": 266.55, "r_x3": 50.11, "r_y3": 266.55, "coord_origin": "TOPLEFT" }, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 287.4, "r_x1": 171.57, "r_y1": 287.4, "r_x2": 171.57, "r_y2": 278.44, "r_x3": 62.07, "r_y3": 278.44, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.57, "r_y0": 287.47, "r_x1": 174.34, "r_y1": 287.47, "r_x2": 174.34, "r_y2": 278.56, "r_x3": 171.57, "r_y3": 278.56, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.19, "r_y0": 287.47, "r_x1": 286.36, "r_y1": 287.47, "r_x2": 286.36, "r_y2": 278.56, "r_x3": 185.19, "r_y3": 278.56, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 299.42, "r_x1": 286.37, "r_y1": 299.42, "r_x2": 286.37, "r_y2": 290.51, "r_x3": 50.11, "r_y3": 290.51, "coord_origin": "TOPLEFT" }, "text": "(GNN\u2019s) take a radically different approach to table-", "orig": "(GNN\u2019s) take a radically different approach to table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 311.38, "r_x1": 131.17, "r_y1": 311.38, "r_x2": 131.17, "r_y2": 302.47, "r_x3": 50.11, "r_y3": 302.47, "coord_origin": "TOPLEFT" }, "text": "structure extraction.", "orig": "structure extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.85, "r_y0": 311.38, "r_x1": 286.37, "r_y1": 311.38, "r_x2": 286.37, "r_y2": 302.47, "r_x3": 138.85, "r_y3": 302.47, "coord_origin": "TOPLEFT" }, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 323.33, "r_x1": 286.37, "r_y1": 323.33, "r_x2": 286.37, "r_y2": 314.42, "r_x3": 50.11, "r_y3": 314.42, "coord_origin": "TOPLEFT" }, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 335.29, "r_x1": 286.37, "r_y1": 335.29, "r_x2": 286.37, "r_y2": 326.38, "r_x3": 50.11, "r_y3": 326.38, "coord_origin": "TOPLEFT" }, "text": "one creates an initial graph, where each of the text-cells", "orig": "one creates an initial graph, where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 347.24, "r_x1": 286.37, "r_y1": 347.24, "r_x2": 286.37, "r_y2": 338.33, "r_x3": 50.11, "r_y3": 338.33, "coord_origin": "TOPLEFT" }, "text": "becomes a node in the graph similar to [33, 34, 2]. Each", "orig": "becomes a node in the graph similar to [33, 34, 2]. Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.2, "r_x1": 286.37, "r_y1": 359.2, "r_x2": 286.37, "r_y2": 350.29, "r_x3": 50.11, "r_y3": 350.29, "coord_origin": "TOPLEFT" }, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.15, "r_x1": 286.37, "r_y1": 371.15, "r_x2": 286.37, "r_y2": 362.25, "r_x3": 50.11, "r_y3": 362.25, "coord_origin": "TOPLEFT" }, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 383.11, "r_x1": 286.37, "r_y1": 383.11, "r_x2": 286.37, "r_y2": 374.2, "r_x3": 50.11, "r_y3": 374.2, "coord_origin": "TOPLEFT" }, "text": "text. Furthermore, nodes that represent adjacent text-cells", "orig": "text. Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 395.06, "r_x1": 286.37, "r_y1": 395.06, "r_x2": 286.37, "r_y2": 386.16, "r_x3": 50.11, "r_y3": 386.16, "coord_origin": "TOPLEFT" }, "text": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 407.02, "r_x1": 286.37, "r_y1": 407.02, "r_x2": 286.37, "r_y2": 398.11, "r_x3": 50.11, "r_y3": 398.11, "coord_origin": "TOPLEFT" }, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 418.97, "r_x1": 286.37, "r_y1": 418.97, "r_x2": 286.37, "r_y2": 410.07, "r_x3": 50.11, "r_y3": 410.07, "coord_origin": "TOPLEFT" }, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 430.93, "r_x1": 286.37, "r_y1": 430.93, "r_x2": 286.37, "r_y2": 422.02, "r_x3": 50.11, "r_y3": 422.02, "coord_origin": "TOPLEFT" }, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 442.88, "r_x1": 198.24, "r_y1": 442.88, "r_x2": 198.24, "r_y2": 433.98, "r_x3": 50.11, "r_y3": 433.98, "coord_origin": "TOPLEFT" }, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.93, "r_y0": 442.88, "r_x1": 286.37, "r_y1": 442.88, "r_x2": 286.37, "r_y2": 433.98, "r_x3": 205.93, "r_y3": 433.98, "coord_origin": "TOPLEFT" }, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 454.84, "r_x1": 286.37, "r_y1": 454.84, "r_x2": 286.37, "r_y2": 445.93, "r_x3": 50.11, "r_y3": 445.93, "coord_origin": "TOPLEFT" }, "text": "represent the table-structure. With this approach, one can", "orig": "represent the table-structure. With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 466.79, "r_x1": 286.37, "r_y1": 466.79, "r_x2": 286.37, "r_y2": 457.89, "r_x3": 50.11, "r_y3": 457.89, "coord_origin": "TOPLEFT" }, "text": "avoid the need to build custom OCR decoders. However,", "orig": "avoid the need to build custom OCR decoders. However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 478.75, "r_x1": 286.37, "r_y1": 478.75, "r_x2": 286.37, "r_y2": 469.84, "r_x3": 50.11, "r_y3": 469.84, "coord_origin": "TOPLEFT" }, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 490.7, "r_x1": 186.5, "r_y1": 490.7, "r_x2": 186.5, "r_y2": 481.8, "r_x3": 50.11, "r_y3": 481.8, "coord_origin": "TOPLEFT" }, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 502.65, "r_x1": 252.88, "r_y1": 502.65, "r_x2": 252.88, "r_y2": 493.69, "r_x3": 62.07, "r_y3": 493.69, "coord_origin": "TOPLEFT" }, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.88, "r_y0": 502.71, "r_x1": 286.37, "r_y1": 502.71, "r_x2": 286.37, "r_y2": 493.81, "r_x3": 252.88, "r_y3": 493.81, "coord_origin": "TOPLEFT" }, "text": ": A pop-", "orig": ": A pop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 514.67, "r_x1": 286.37, "r_y1": 514.67, "r_x2": 286.37, "r_y2": 505.76, "r_x3": 50.11, "r_y3": 505.76, "coord_origin": "TOPLEFT" }, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 526.62, "r_x1": 286.37, "r_y1": 526.62, "r_x2": 286.37, "r_y2": 517.72, "r_x3": 50.11, "r_y3": 517.72, "coord_origin": "TOPLEFT" }, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 538.58, "r_x1": 286.37, "r_y1": 538.58, "r_x2": 286.37, "r_y2": 529.67, "r_x3": 50.11, "r_y3": 529.67, "coord_origin": "TOPLEFT" }, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 550.54, "r_x1": 286.37, "r_y1": 550.54, "r_x2": 286.37, "r_y2": 541.63, "r_x3": 50.11, "r_y3": 541.63, "coord_origin": "TOPLEFT" }, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 562.49, "r_x1": 286.37, "r_y1": 562.49, "r_x2": 286.37, "r_y2": 553.58, "r_x3": 50.11, "r_y3": 553.58, "coord_origin": "TOPLEFT" }, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 574.45, "r_x1": 286.37, "r_y1": 574.45, "r_x2": 286.37, "r_y2": 565.54, "r_x3": 50.11, "r_y3": 565.54, "coord_origin": "TOPLEFT" }, "text": "its images) and finally uses different rule-sets to obtain", "orig": "its images) and finally uses different rule-sets to obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 586.4, "r_x1": 286.37, "r_y1": 586.4, "r_x2": 286.37, "r_y2": 577.49, "r_x3": 50.11, "r_y3": 577.49, "coord_origin": "TOPLEFT" }, "text": "its table-structure. Currently, this approach achieves state-", "orig": "its table-structure. Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 598.36, "r_x1": 286.37, "r_y1": 598.36, "r_x2": 286.37, "r_y2": 589.45, "r_x3": 50.11, "r_y3": 589.45, "coord_origin": "TOPLEFT" }, "text": "of-the-art results, but is not an end-to-end deep-learning", "orig": "of-the-art results, but is not an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 610.31, "r_x1": 286.37, "r_y1": 610.31, "r_x2": 286.37, "r_y2": 601.4, "r_x3": 50.11, "r_y3": 601.4, "coord_origin": "TOPLEFT" }, "text": "method. As such, new rules need to be written if different", "orig": "method. As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 622.27, "r_x1": 175.99, "r_y1": 622.27, "r_x2": 175.99, "r_y2": 613.36, "r_x3": 50.11, "r_y3": 613.36, "coord_origin": "TOPLEFT" }, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 646.69, "r_x1": 57.82, "r_y1": 646.69, "r_x2": 57.82, "r_y2": 635.94, "r_x3": 50.11, "r_y3": 635.94, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.11, "r_y0": 646.69, "r_x1": 105.23, "r_y1": 646.69, "r_x2": 105.23, "r_y2": 635.94, "r_x3": 68.11, "r_y3": 635.94, "coord_origin": "TOPLEFT" }, "text": "Datasets", "orig": "Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 665.33, "r_x1": 286.36, "r_y1": 665.33, "r_x2": 286.36, "r_y2": 656.43, "r_x3": 62.07, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "evaluate our models. These datasets span over various ap-", "orig": "evaluate our models. These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 166.25, "r_y1": 701.2, "r_x2": 166.25, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.69, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 173.69, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.8, "r_y0": 88.56, "r_x1": 486.85, "r_y1": 88.56, "r_x2": 486.85, "r_y2": 79.81, "r_x3": 380.8, "r_y3": 79.81, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.77, "r_y0": 250.77, "r_x1": 469.79, "r_y1": 250.77, "r_x2": 469.79, "r_y2": 242.03, "r_x3": 396.77, "r_y3": 242.03, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.98, "r_y0": 239.25, "r_x1": 324.79, "r_y1": 239.25, "r_x2": 324.79, "r_y2": 233.42, "r_x3": 320.98, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.48, "r_y0": 239.25, "r_x1": 418.11, "r_y1": 239.25, "r_x2": 418.11, "r_y2": 233.42, "r_x3": 410.48, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.85, "r_y0": 239.25, "r_x1": 508.48, "r_y1": 239.25, "r_x2": 508.48, "r_y2": 233.42, "r_x3": 500.85, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.3, "r_y0": 239.25, "r_x1": 372.93, "r_y1": 239.25, "r_x2": 372.93, "r_y2": 233.42, "r_x3": 365.3, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.67, "r_y0": 239.25, "r_x1": 463.3, "r_y1": 239.25, "r_x2": 463.3, "r_y2": 233.42, "r_x3": 455.67, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.04, "r_y0": 239.25, "r_x1": 549.67, "r_y1": 239.25, "r_x2": 549.67, "r_y2": 233.42, "r_x3": 542.04, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04, "r_y0": 236.28, "r_x1": 319.86, "r_y1": 236.28, "r_x2": 319.86, "r_y2": 230.45, "r_x3": 316.04, "r_y3": 230.45, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.63, "r_y0": 204.52, "r_x1": 316.44, "r_y1": 204.52, "r_x2": 316.44, "r_y2": 198.69, "r_x3": 312.63, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.44, "r_y0": 204.52, "r_x1": 320.26, "r_y1": 204.52, "r_x2": 320.26, "r_y2": 198.69, "r_x3": 316.44, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.15, "r_y0": 173.93, "r_x1": 316.97, "r_y1": 173.93, "r_x2": 316.97, "r_y2": 168.1, "r_x3": 313.15, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96, "r_y0": 173.93, "r_x1": 320.78, "r_y1": 173.93, "r_x2": 320.78, "r_y2": 168.1, "r_x3": 316.96, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.93, "r_y0": 142.42, "r_x1": 316.75, "r_y1": 142.42, "r_x2": 316.75, "r_y2": 136.59, "r_x3": 312.93, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74, "r_y0": 142.42, "r_x1": 320.56, "r_y1": 142.42, "r_x2": 320.56, "r_y2": 136.59, "r_x3": 316.74, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 111.43, "r_x1": 316.3, "r_y1": 111.43, "r_x2": 316.3, "r_y2": 105.6, "r_x3": 312.48, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 111.43, "r_x1": 320.11, "r_y1": 111.43, "r_x2": 320.11, "r_y2": 105.6, "r_x3": 316.3, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 218.09, "r_x1": 316.3, "r_y1": 218.09, "r_x2": 316.3, "r_y2": 212.26, "r_x3": 312.48, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 218.09, "r_x1": 320.11, "r_y1": 218.09, "r_x2": 320.11, "r_y2": 212.26, "r_x3": 316.3, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.08, "r_y0": 189.55, "r_x1": 316.89, "r_y1": 189.55, "r_x2": 316.89, "r_y2": 183.72, "r_x3": 313.08, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89, "r_y0": 189.55, "r_x1": 320.71, "r_y1": 189.55, "r_x2": 320.71, "r_y2": 183.72, "r_x3": 316.89, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76, "r_y0": 158.31, "r_x1": 316.58, "r_y1": 158.31, "r_x2": 316.58, "r_y2": 152.47, "r_x3": 312.76, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.58, "r_y0": 158.31, "r_x1": 320.39, "r_y1": 158.31, "r_x2": 320.39, "r_y2": 152.47, "r_x3": 316.58, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.2, "r_y0": 126.4, "r_x1": 316.01, "r_y1": 126.4, "r_x2": 316.01, "r_y2": 120.57, "r_x3": 312.2, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01, "r_y0": 126.4, "r_x1": 319.83, "r_y1": 126.4, "r_x2": 319.83, "r_y2": 120.57, "r_x3": 316.01, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 95.94, "r_x1": 316.63, "r_y1": 95.94, "r_x2": 316.63, "r_y2": 90.11, "r_x3": 312.82, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63, "r_y0": 95.94, "r_x1": 320.45, "r_y1": 95.94, "r_x2": 320.45, "r_y2": 90.11, "r_x3": 316.63, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17, "r_y0": 230.02, "r_x1": 536.94, "r_y1": 230.02, "r_x2": 536.94, "r_y2": 222.73, "r_x3": 532.17, "r_y3": 222.73, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.88, "r_y0": 115.56, "r_x1": 547.61, "r_y1": 115.56, "r_x2": 547.61, "r_y2": 108.27, "r_x3": 532.88, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.77, "r_y0": 138.07, "r_x1": 542.74, "r_y1": 138.07, "r_x2": 542.74, "r_y2": 130.78, "r_x3": 532.77, "r_y3": 130.78, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.8, "r_y0": 161.21, "r_x1": 542.76, "r_y1": 161.21, "r_x2": 542.76, "r_y2": 153.92, "r_x3": 532.8, "r_y3": 153.92, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.57, "r_y0": 184.05, "r_x1": 542.54, "r_y1": 184.05, "r_x2": 542.54, "r_y2": 176.76, "r_x3": 532.57, "r_y3": 176.76, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.15, "r_y0": 206.94, "r_x1": 542.11, "r_y1": 206.94, "r_x2": 542.11, "r_y2": 199.65, "r_x3": 532.15, "r_y3": 199.65, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 276.74, "r_x1": 346.06, "r_y1": 276.74, "r_x2": 346.06, "r_y2": 267.84, "r_x3": 308.86, "r_y3": 267.84, "coord_origin": "TOPLEFT" }, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.49, "r_y0": 276.74, "r_x1": 545.12, "r_y1": 276.74, "r_x2": 545.12, "r_y2": 267.84, "r_x3": 354.49, "r_y3": 267.84, "coord_origin": "TOPLEFT" }, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 288.7, "r_x1": 498.57, "r_y1": 288.7, "r_x2": 498.57, "r_y2": 279.79, "r_x3": 308.86, "r_y3": 279.79, "coord_origin": "TOPLEFT" }, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 326.38, "r_x1": 437.27, "r_y1": 326.38, "r_x2": 437.27, "r_y2": 317.47, "r_x3": 308.86, "r_y3": 317.47, "coord_origin": "TOPLEFT" }, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 340.44, "r_x1": 545.12, "r_y1": 340.44, "r_x2": 545.12, "r_y2": 331.53, "r_x3": 320.82, "r_y3": 331.53, "coord_origin": "TOPLEFT" }, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 352.39, "r_x1": 545.12, "r_y1": 352.39, "r_x2": 545.12, "r_y2": 343.49, "r_x3": 308.86, "r_y3": 343.49, "coord_origin": "TOPLEFT" }, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 364.35, "r_x1": 545.12, "r_y1": 364.35, "r_x2": 545.12, "r_y2": 355.44, "r_x3": 308.86, "r_y3": 355.44, "coord_origin": "TOPLEFT" }, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 376.3, "r_x1": 545.12, "r_y1": 376.3, "r_x2": 545.12, "r_y2": 367.4, "r_x3": 308.86, "r_y3": 367.4, "coord_origin": "TOPLEFT" }, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 388.26, "r_x1": 545.12, "r_y1": 388.26, "r_x2": 545.12, "r_y2": 379.35, "r_x3": 308.86, "r_y3": 379.35, "coord_origin": "TOPLEFT" }, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.21, "r_x1": 545.12, "r_y1": 400.21, "r_x2": 545.12, "r_y2": 391.31, "r_x3": 308.86, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "a table is characterized as \u201csimple\u201d when it does not contain", "orig": "a table is characterized as \u201csimple\u201d when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.17, "r_x1": 545.12, "r_y1": 412.17, "r_x2": 545.12, "r_y2": 403.26, "r_x3": 308.86, "r_y3": 403.26, "coord_origin": "TOPLEFT" }, "text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.12, "r_x1": 545.12, "r_y1": 424.12, "r_x2": 545.12, "r_y2": 415.22, "r_x3": 308.86, "r_y3": 415.22, "coord_origin": "TOPLEFT" }, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.08, "r_x1": 545.12, "r_y1": 436.08, "r_x2": 545.12, "r_y2": 427.17, "r_x3": 308.86, "r_y3": 427.17, "coord_origin": "TOPLEFT" }, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.03, "r_x1": 545.12, "r_y1": 448.03, "r_x2": 545.12, "r_y2": 439.13, "r_x3": 308.86, "r_y3": 439.13, "coord_origin": "TOPLEFT" }, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 459.99, "r_x1": 545.12, "r_y1": 459.99, "r_x2": 545.12, "r_y2": 451.08, "r_x3": 308.86, "r_y3": 451.08, "coord_origin": "TOPLEFT" }, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 471.94, "r_x1": 545.12, "r_y1": 471.94, "r_x2": 545.12, "r_y2": 463.04, "r_x3": 308.86, "r_y3": 463.04, "coord_origin": "TOPLEFT" }, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 483.9, "r_x1": 545.12, "r_y1": 483.9, "r_x2": 545.12, "r_y2": 474.99, "r_x3": 308.86, "r_y3": 474.99, "coord_origin": "TOPLEFT" }, "text": "text content. Similarly to the PubTabNet, the annotations", "orig": "text content. Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 495.86, "r_x1": 545.12, "r_y1": 495.86, "r_x2": 545.12, "r_y2": 486.95, "r_x3": 308.86, "r_y3": 486.95, "coord_origin": "TOPLEFT" }, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 507.81, "r_x1": 545.12, "r_y1": 507.81, "r_x2": 545.12, "r_y2": 498.9, "r_x3": 308.86, "r_y3": 498.9, "coord_origin": "TOPLEFT" }, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 519.77, "r_x1": 545.12, "r_y1": 519.77, "r_x2": 545.12, "r_y2": 510.86, "r_x3": 308.86, "r_y3": 510.86, "coord_origin": "TOPLEFT" }, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 531.72, "r_x1": 545.12, "r_y1": 531.72, "r_x2": 545.12, "r_y2": 522.81, "r_x3": 308.86, "r_y3": 522.81, "coord_origin": "TOPLEFT" }, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 543.68, "r_x1": 545.12, "r_y1": 543.68, "r_x2": 545.12, "r_y2": 534.77, "r_x3": 308.86, "r_y3": 534.77, "coord_origin": "TOPLEFT" }, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 555.63, "r_x1": 545.12, "r_y1": 555.63, "r_x2": 545.12, "r_y2": 546.72, "r_x3": 308.86, "r_y3": 546.72, "coord_origin": "TOPLEFT" }, "text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 567.59, "r_x1": 545.12, "r_y1": 567.59, "r_x2": 545.12, "r_y2": 558.68, "r_x3": 308.86, "r_y3": 558.68, "coord_origin": "TOPLEFT" }, "text": "47% complex). Finally the TableBank dataset consists of", "orig": "47% complex). Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 579.54, "r_x1": 545.12, "r_y1": 579.54, "r_x2": 545.12, "r_y2": 570.64, "r_x3": 308.86, "r_y3": 570.64, "coord_origin": "TOPLEFT" }, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 591.5, "r_x1": 545.11, "r_y1": 591.5, "r_x2": 545.11, "r_y2": 582.59, "r_x3": 308.86, "r_y3": 582.59, "coord_origin": "TOPLEFT" }, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 603.45, "r_x1": 545.12, "r_y1": 603.45, "r_x2": 545.12, "r_y2": 594.55, "r_x3": 308.86, "r_y3": 594.55, "coord_origin": "TOPLEFT" }, "text": "boxes of the table cells. The entire dataset consists of sim-", "orig": "boxes of the table cells. The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 615.41, "r_x1": 545.12, "r_y1": 615.41, "r_x2": 545.12, "r_y2": 606.5, "r_x3": 308.86, "r_y3": 606.5, "coord_origin": "TOPLEFT" }, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 627.36, "r_x1": 348.16, "r_y1": 627.36, "r_x2": 348.16, "r_y2": 618.46, "r_x3": 308.86, "r_y3": 618.46, "coord_origin": "TOPLEFT" }, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 641.42, "r_x1": 545.11, "r_y1": 641.42, "r_x2": 545.11, "r_y2": 632.51, "r_x3": 320.82, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.38, "r_x1": 545.12, "r_y1": 653.38, "r_x2": 545.12, "r_y2": 644.47, "r_x3": 308.86, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.33, "r_x1": 545.12, "r_y1": 665.33, "r_x2": 545.12, "r_y2": 656.42, "r_x3": 308.86, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "cal purposes. Given the size of PubTabNet, we adopted its", "orig": "cal purposes. Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "as PNG images with a resolution of 72 dpi. Additionally,", "orig": "as PNG images with a resolution of 72 dpi. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 250.15, "b": 84.11, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 250.15, "r_y1": 84.11, "r_x2": 250.15, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 87.22, "r": 286.37, "b": 275.45, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 96.13, "r_x1": 70.37, "r_y1": 96.13, "r_x2": 70.37, "r_y2": 87.22, "r_x3": 62.07, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.93, "r_y0": 96.13, "r_x1": 110.95, "r_y1": 96.13, "r_x2": 110.95, "r_y2": 87.22, "r_x3": 76.93, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.54, "r_y0": 96.13, "r_x1": 136.26, "r_y1": 96.13, "r_x2": 136.26, "r_y2": 87.22, "r_x3": 118.54, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.82, "r_y0": 96.13, "r_x1": 175.37, "r_y1": 96.13, "r_x2": 175.37, "r_y2": 87.22, "r_x3": 142.82, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.95, "r_y0": 96.13, "r_x1": 232.84, "r_y1": 96.13, "r_x2": 232.84, "r_y2": 87.22, "r_x3": 181.95, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.41, "r_y0": 96.13, "r_x1": 265.41, "r_y1": 96.13, "r_x2": 265.41, "r_y2": 87.22, "r_x3": 239.41, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.98, "r_y0": 96.13, "r_x1": 286.36, "r_y1": 96.13, "r_x2": 286.36, "r_y2": 87.22, "r_x3": 271.98, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.08, "r_x1": 286.37, "r_y1": 108.08, "r_x2": 286.37, "r_y2": 99.17, "r_x3": 50.11, "r_y3": 99.17, "coord_origin": "TOPLEFT" }, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 120.04, "r_x1": 286.37, "r_y1": 120.04, "r_x2": 286.37, "r_y2": 111.13, "r_x3": 50.11, "r_y3": 111.13, "coord_origin": "TOPLEFT" }, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.99, "r_x1": 286.37, "r_y1": 131.99, "r_x2": 286.37, "r_y2": 123.09, "r_x3": 50.11, "r_y3": 123.09, "coord_origin": "TOPLEFT" }, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 143.95, "r_x1": 286.37, "r_y1": 143.95, "r_x2": 286.37, "r_y2": 135.04, "r_x3": 50.11, "r_y3": 135.04, "coord_origin": "TOPLEFT" }, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 155.9, "r_x1": 286.37, "r_y1": 155.9, "r_x2": 286.37, "r_y2": 147.0, "r_x3": 50.11, "r_y3": 147.0, "coord_origin": "TOPLEFT" }, "text": "bedded in the content-decoder. This reliance on a custom,", "orig": "bedded in the content-decoder. This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 167.86, "r_x1": 286.37, "r_y1": 167.86, "r_x2": 286.37, "r_y2": 158.95, "r_x3": 50.11, "r_y3": 158.95, "coord_origin": "TOPLEFT" }, "text": "implicit OCR decoder is of course problematic. OCR is a", "orig": "implicit OCR decoder is of course problematic. OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 179.81, "r_x1": 286.37, "r_y1": 179.81, "r_x2": 286.37, "r_y2": 170.91, "r_x3": 50.11, "r_y3": 170.91, "coord_origin": "TOPLEFT" }, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 191.77, "r_x1": 286.37, "r_y1": 191.77, "r_x2": 286.37, "r_y2": 182.86, "r_x3": 50.11, "r_y3": 182.86, "coord_origin": "TOPLEFT" }, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 203.72, "r_x1": 286.37, "r_y1": 203.72, "r_x2": 286.37, "r_y2": 194.82, "r_x3": 50.11, "r_y3": 194.82, "coord_origin": "TOPLEFT" }, "text": "limited availability for non-english content in the current", "orig": "limited availability for non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 215.68, "r_x1": 286.37, "r_y1": 215.68, "r_x2": 286.37, "r_y2": 206.77, "r_x3": 50.11, "r_y3": 206.77, "coord_origin": "TOPLEFT" }, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 227.63, "r_x1": 286.37, "r_y1": 227.63, "r_x2": 286.37, "r_y2": 218.73, "r_x3": 50.11, "r_y3": 218.73, "coord_origin": "TOPLEFT" }, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 239.59, "r_x1": 286.37, "r_y1": 239.59, "r_x2": 286.37, "r_y2": 230.68, "r_x3": 50.11, "r_y3": 230.68, "coord_origin": "TOPLEFT" }, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 251.54, "r_x1": 286.37, "r_y1": 251.54, "r_x2": 286.37, "r_y2": 242.64, "r_x3": 50.11, "r_y3": 242.64, "coord_origin": "TOPLEFT" }, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 263.5, "r_x1": 286.37, "r_y1": 263.5, "r_x2": 286.37, "r_y2": 254.59, "r_x3": 50.11, "r_y3": 254.59, "coord_origin": "TOPLEFT" }, "text": "cell. The latter was the inspiration for the work of this pa-", "orig": "cell. The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 275.45, "r_x1": 64.78, "r_y1": 275.45, "r_x2": 64.78, "r_y2": 266.55, "r_x3": 50.11, "r_y3": 266.55, "coord_origin": "TOPLEFT" }, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 278.44, "r": 286.37, "b": 490.7, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 287.4, "r_x1": 171.57, "r_y1": 287.4, "r_x2": 171.57, "r_y2": 278.44, "r_x3": 62.07, "r_y3": 278.44, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.57, "r_y0": 287.47, "r_x1": 174.34, "r_y1": 287.47, "r_x2": 174.34, "r_y2": 278.56, "r_x3": 171.57, "r_y3": 278.56, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.19, "r_y0": 287.47, "r_x1": 286.36, "r_y1": 287.47, "r_x2": 286.36, "r_y2": 278.56, "r_x3": 185.19, "r_y3": 278.56, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 299.42, "r_x1": 286.37, "r_y1": 299.42, "r_x2": 286.37, "r_y2": 290.51, "r_x3": 50.11, "r_y3": 290.51, "coord_origin": "TOPLEFT" }, "text": "(GNN\u2019s) take a radically different approach to table-", "orig": "(GNN\u2019s) take a radically different approach to table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 311.38, "r_x1": 131.17, "r_y1": 311.38, "r_x2": 131.17, "r_y2": 302.47, "r_x3": 50.11, "r_y3": 302.47, "coord_origin": "TOPLEFT" }, "text": "structure extraction.", "orig": "structure extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.85, "r_y0": 311.38, "r_x1": 286.37, "r_y1": 311.38, "r_x2": 286.37, "r_y2": 302.47, "r_x3": 138.85, "r_y3": 302.47, "coord_origin": "TOPLEFT" }, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 323.33, "r_x1": 286.37, "r_y1": 323.33, "r_x2": 286.37, "r_y2": 314.42, "r_x3": 50.11, "r_y3": 314.42, "coord_origin": "TOPLEFT" }, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 335.29, "r_x1": 286.37, "r_y1": 335.29, "r_x2": 286.37, "r_y2": 326.38, "r_x3": 50.11, "r_y3": 326.38, "coord_origin": "TOPLEFT" }, "text": "one creates an initial graph, where each of the text-cells", "orig": "one creates an initial graph, where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 347.24, "r_x1": 286.37, "r_y1": 347.24, "r_x2": 286.37, "r_y2": 338.33, "r_x3": 50.11, "r_y3": 338.33, "coord_origin": "TOPLEFT" }, "text": "becomes a node in the graph similar to [33, 34, 2]. Each", "orig": "becomes a node in the graph similar to [33, 34, 2]. Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.2, "r_x1": 286.37, "r_y1": 359.2, "r_x2": 286.37, "r_y2": 350.29, "r_x3": 50.11, "r_y3": 350.29, "coord_origin": "TOPLEFT" }, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.15, "r_x1": 286.37, "r_y1": 371.15, "r_x2": 286.37, "r_y2": 362.25, "r_x3": 50.11, "r_y3": 362.25, "coord_origin": "TOPLEFT" }, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 383.11, "r_x1": 286.37, "r_y1": 383.11, "r_x2": 286.37, "r_y2": 374.2, "r_x3": 50.11, "r_y3": 374.2, "coord_origin": "TOPLEFT" }, "text": "text. Furthermore, nodes that represent adjacent text-cells", "orig": "text. Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 395.06, "r_x1": 286.37, "r_y1": 395.06, "r_x2": 286.37, "r_y2": 386.16, "r_x3": 50.11, "r_y3": 386.16, "coord_origin": "TOPLEFT" }, "text": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 407.02, "r_x1": 286.37, "r_y1": 407.02, "r_x2": 286.37, "r_y2": 398.11, "r_x3": 50.11, "r_y3": 398.11, "coord_origin": "TOPLEFT" }, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 418.97, "r_x1": 286.37, "r_y1": 418.97, "r_x2": 286.37, "r_y2": 410.07, "r_x3": 50.11, "r_y3": 410.07, "coord_origin": "TOPLEFT" }, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 430.93, "r_x1": 286.37, "r_y1": 430.93, "r_x2": 286.37, "r_y2": 422.02, "r_x3": 50.11, "r_y3": 422.02, "coord_origin": "TOPLEFT" }, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 442.88, "r_x1": 198.24, "r_y1": 442.88, "r_x2": 198.24, "r_y2": 433.98, "r_x3": 50.11, "r_y3": 433.98, "coord_origin": "TOPLEFT" }, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.93, "r_y0": 442.88, "r_x1": 286.37, "r_y1": 442.88, "r_x2": 286.37, "r_y2": 433.98, "r_x3": 205.93, "r_y3": 433.98, "coord_origin": "TOPLEFT" }, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 454.84, "r_x1": 286.37, "r_y1": 454.84, "r_x2": 286.37, "r_y2": 445.93, "r_x3": 50.11, "r_y3": 445.93, "coord_origin": "TOPLEFT" }, "text": "represent the table-structure. With this approach, one can", "orig": "represent the table-structure. With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 466.79, "r_x1": 286.37, "r_y1": 466.79, "r_x2": 286.37, "r_y2": 457.89, "r_x3": 50.11, "r_y3": 457.89, "coord_origin": "TOPLEFT" }, "text": "avoid the need to build custom OCR decoders. However,", "orig": "avoid the need to build custom OCR decoders. However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 478.75, "r_x1": 286.37, "r_y1": 478.75, "r_x2": 286.37, "r_y2": 469.84, "r_x3": 50.11, "r_y3": 469.84, "coord_origin": "TOPLEFT" }, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 490.7, "r_x1": 186.5, "r_y1": 490.7, "r_x2": 186.5, "r_y2": 481.8, "r_x3": 50.11, "r_y3": 481.8, "coord_origin": "TOPLEFT" }, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 493.69, "r": 286.37, "b": 622.27, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 502.65, "r_x1": 252.88, "r_y1": 502.65, "r_x2": 252.88, "r_y2": 493.69, "r_x3": 62.07, "r_y3": 493.69, "coord_origin": "TOPLEFT" }, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.88, "r_y0": 502.71, "r_x1": 286.37, "r_y1": 502.71, "r_x2": 286.37, "r_y2": 493.81, "r_x3": 252.88, "r_y3": 493.81, "coord_origin": "TOPLEFT" }, "text": ": A pop-", "orig": ": A pop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 514.67, "r_x1": 286.37, "r_y1": 514.67, "r_x2": 286.37, "r_y2": 505.76, "r_x3": 50.11, "r_y3": 505.76, "coord_origin": "TOPLEFT" }, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 526.62, "r_x1": 286.37, "r_y1": 526.62, "r_x2": 286.37, "r_y2": 517.72, "r_x3": 50.11, "r_y3": 517.72, "coord_origin": "TOPLEFT" }, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 538.58, "r_x1": 286.37, "r_y1": 538.58, "r_x2": 286.37, "r_y2": 529.67, "r_x3": 50.11, "r_y3": 529.67, "coord_origin": "TOPLEFT" }, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 550.54, "r_x1": 286.37, "r_y1": 550.54, "r_x2": 286.37, "r_y2": 541.63, "r_x3": 50.11, "r_y3": 541.63, "coord_origin": "TOPLEFT" }, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 562.49, "r_x1": 286.37, "r_y1": 562.49, "r_x2": 286.37, "r_y2": 553.58, "r_x3": 50.11, "r_y3": 553.58, "coord_origin": "TOPLEFT" }, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 574.45, "r_x1": 286.37, "r_y1": 574.45, "r_x2": 286.37, "r_y2": 565.54, "r_x3": 50.11, "r_y3": 565.54, "coord_origin": "TOPLEFT" }, "text": "its images) and finally uses different rule-sets to obtain", "orig": "its images) and finally uses different rule-sets to obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 586.4, "r_x1": 286.37, "r_y1": 586.4, "r_x2": 286.37, "r_y2": 577.49, "r_x3": 50.11, "r_y3": 577.49, "coord_origin": "TOPLEFT" }, "text": "its table-structure. Currently, this approach achieves state-", "orig": "its table-structure. Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 598.36, "r_x1": 286.37, "r_y1": 598.36, "r_x2": 286.37, "r_y2": 589.45, "r_x3": 50.11, "r_y3": 589.45, "coord_origin": "TOPLEFT" }, "text": "of-the-art results, but is not an end-to-end deep-learning", "orig": "of-the-art results, but is not an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 610.31, "r_x1": 286.37, "r_y1": 610.31, "r_x2": 286.37, "r_y2": 601.4, "r_x3": 50.11, "r_y3": 601.4, "coord_origin": "TOPLEFT" }, "text": "method. As such, new rules need to be written if different", "orig": "method. As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 622.27, "r_x1": 175.99, "r_y1": 622.27, "r_x2": 175.99, "r_y2": 613.36, "r_x3": 50.11, "r_y3": 613.36, "coord_origin": "TOPLEFT" }, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "section_header", "bbox": { "l": 50.11, "t": 635.94, "r": 105.23, "b": 646.69, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 646.69, "r_x1": 57.82, "r_y1": 646.69, "r_x2": 57.82, "r_y2": 635.94, "r_x3": 50.11, "r_y3": 635.94, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.11, "r_y0": 646.69, "r_x1": 105.23, "r_y1": 646.69, "r_x2": 105.23, "r_y2": 635.94, "r_x3": 68.11, "r_y3": 635.94, "coord_origin": "TOPLEFT" }, "text": "Datasets", "orig": "Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 656.43, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 665.33, "r_x1": 286.36, "r_y1": 665.33, "r_x2": 286.36, "r_y2": 656.43, "r_x3": 62.07, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "evaluate our models. These datasets span over various ap-", "orig": "evaluate our models. These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 166.25, "r_y1": 701.2, "r_x2": 166.25, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.69, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 173.69, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "picture", "bbox": { "l": 312.1, "t": 78.44, "r": 550.39, "b": 250.61, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.8, "r_y0": 88.56, "r_x1": 486.85, "r_y1": 88.56, "r_x2": 486.85, "r_y2": 79.81, "r_x3": 380.8, "r_y3": 79.81, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.77, "r_y0": 250.77, "r_x1": 469.79, "r_y1": 250.77, "r_x2": 469.79, "r_y2": 242.03, "r_x3": 396.77, "r_y3": 242.03, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.98, "r_y0": 239.25, "r_x1": 324.79, "r_y1": 239.25, "r_x2": 324.79, "r_y2": 233.42, "r_x3": 320.98, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.48, "r_y0": 239.25, "r_x1": 418.11, "r_y1": 239.25, "r_x2": 418.11, "r_y2": 233.42, "r_x3": 410.48, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.85, "r_y0": 239.25, "r_x1": 508.48, "r_y1": 239.25, "r_x2": 508.48, "r_y2": 233.42, "r_x3": 500.85, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.3, "r_y0": 239.25, "r_x1": 372.93, "r_y1": 239.25, "r_x2": 372.93, "r_y2": 233.42, "r_x3": 365.3, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.67, "r_y0": 239.25, "r_x1": 463.3, "r_y1": 239.25, "r_x2": 463.3, "r_y2": 233.42, "r_x3": 455.67, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.04, "r_y0": 239.25, "r_x1": 549.67, "r_y1": 239.25, "r_x2": 549.67, "r_y2": 233.42, "r_x3": 542.04, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04, "r_y0": 236.28, "r_x1": 319.86, "r_y1": 236.28, "r_x2": 319.86, "r_y2": 230.45, "r_x3": 316.04, "r_y3": 230.45, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.63, "r_y0": 204.52, "r_x1": 316.44, "r_y1": 204.52, "r_x2": 316.44, "r_y2": 198.69, "r_x3": 312.63, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.44, "r_y0": 204.52, "r_x1": 320.26, "r_y1": 204.52, "r_x2": 320.26, "r_y2": 198.69, "r_x3": 316.44, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.15, "r_y0": 173.93, "r_x1": 316.97, "r_y1": 173.93, "r_x2": 316.97, "r_y2": 168.1, "r_x3": 313.15, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96, "r_y0": 173.93, "r_x1": 320.78, "r_y1": 173.93, "r_x2": 320.78, "r_y2": 168.1, "r_x3": 316.96, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.93, "r_y0": 142.42, "r_x1": 316.75, "r_y1": 142.42, "r_x2": 316.75, "r_y2": 136.59, "r_x3": 312.93, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74, "r_y0": 142.42, "r_x1": 320.56, "r_y1": 142.42, "r_x2": 320.56, "r_y2": 136.59, "r_x3": 316.74, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 111.43, "r_x1": 316.3, "r_y1": 111.43, "r_x2": 316.3, "r_y2": 105.6, "r_x3": 312.48, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 111.43, "r_x1": 320.11, "r_y1": 111.43, "r_x2": 320.11, "r_y2": 105.6, "r_x3": 316.3, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 218.09, "r_x1": 316.3, "r_y1": 218.09, "r_x2": 316.3, "r_y2": 212.26, "r_x3": 312.48, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 218.09, "r_x1": 320.11, "r_y1": 218.09, "r_x2": 320.11, "r_y2": 212.26, "r_x3": 316.3, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.08, "r_y0": 189.55, "r_x1": 316.89, "r_y1": 189.55, "r_x2": 316.89, "r_y2": 183.72, "r_x3": 313.08, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89, "r_y0": 189.55, "r_x1": 320.71, "r_y1": 189.55, "r_x2": 320.71, "r_y2": 183.72, "r_x3": 316.89, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76, "r_y0": 158.31, "r_x1": 316.58, "r_y1": 158.31, "r_x2": 316.58, "r_y2": 152.47, "r_x3": 312.76, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.58, "r_y0": 158.31, "r_x1": 320.39, "r_y1": 158.31, "r_x2": 320.39, "r_y2": 152.47, "r_x3": 316.58, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.2, "r_y0": 126.4, "r_x1": 316.01, "r_y1": 126.4, "r_x2": 316.01, "r_y2": 120.57, "r_x3": 312.2, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01, "r_y0": 126.4, "r_x1": 319.83, "r_y1": 126.4, "r_x2": 319.83, "r_y2": 120.57, "r_x3": 316.01, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 95.94, "r_x1": 316.63, "r_y1": 95.94, "r_x2": 316.63, "r_y2": 90.11, "r_x3": 312.82, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63, "r_y0": 95.94, "r_x1": 320.45, "r_y1": 95.94, "r_x2": 320.45, "r_y2": 90.11, "r_x3": 316.63, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17, "r_y0": 230.02, "r_x1": 536.94, "r_y1": 230.02, "r_x2": 536.94, "r_y2": 222.73, "r_x3": 532.17, "r_y3": 222.73, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.88, "r_y0": 115.56, "r_x1": 547.61, "r_y1": 115.56, "r_x2": 547.61, "r_y2": 108.27, "r_x3": 532.88, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.77, "r_y0": 138.07, "r_x1": 542.74, "r_y1": 138.07, "r_x2": 542.74, "r_y2": 130.78, "r_x3": 532.77, "r_y3": 130.78, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.8, "r_y0": 161.21, "r_x1": 542.76, "r_y1": 161.21, "r_x2": 542.76, "r_y2": 153.92, "r_x3": 532.8, "r_y3": 153.92, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.57, "r_y0": 184.05, "r_x1": 542.54, "r_y1": 184.05, "r_x2": 542.54, "r_y2": 176.76, "r_x3": 532.57, "r_y3": 176.76, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.15, "r_y0": 206.94, "r_x1": 542.11, "r_y1": 206.94, "r_x2": 542.11, "r_y2": 199.65, "r_x3": 532.15, "r_y3": 199.65, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 12, "label": "section_header", "bbox": { "l": 380.8, "t": 79.81, "r": 486.85, "b": 88.56, "coord_origin": "TOPLEFT" }, "confidence": 0.569, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.8, "r_y0": 88.56, "r_x1": 486.85, "r_y1": 88.56, "r_x2": 486.85, "r_y2": 79.81, "r_x3": 380.8, "r_y3": 79.81, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 396.77, "t": 242.03, "r": 469.79, "b": 250.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.77, "r_y0": 250.77, "r_x1": 469.79, "r_y1": 250.77, "r_x2": 469.79, "r_y2": 242.03, "r_x3": 396.77, "r_y3": 242.03, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 320.98, "t": 233.42, "r": 324.79, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.98, "r_y0": 239.25, "r_x1": 324.79, "r_y1": 239.25, "r_x2": 324.79, "r_y2": 233.42, "r_x3": 320.98, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 410.48, "t": 233.42, "r": 418.11, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.48, "r_y0": 239.25, "r_x1": 418.11, "r_y1": 239.25, "r_x2": 418.11, "r_y2": 233.42, "r_x3": 410.48, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 500.85, "t": 233.42, "r": 508.48, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.85, "r_y0": 239.25, "r_x1": 508.48, "r_y1": 239.25, "r_x2": 508.48, "r_y2": 233.42, "r_x3": 500.85, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 365.3, "t": 233.42, "r": 372.93, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.3, "r_y0": 239.25, "r_x1": 372.93, "r_y1": 239.25, "r_x2": 372.93, "r_y2": 233.42, "r_x3": 365.3, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 455.67, "t": 233.42, "r": 463.3, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.67, "r_y0": 239.25, "r_x1": 463.3, "r_y1": 239.25, "r_x2": 463.3, "r_y2": 233.42, "r_x3": 455.67, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 542.04, "t": 233.42, "r": 549.67, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.04, "r_y0": 239.25, "r_x1": 549.67, "r_y1": 239.25, "r_x2": 549.67, "r_y2": 233.42, "r_x3": 542.04, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 316.04, "t": 230.45, "r": 319.86, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04, "r_y0": 236.28, "r_x1": 319.86, "r_y1": 236.28, "r_x2": 319.86, "r_y2": 230.45, "r_x3": 316.04, "r_y3": 230.45, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 312.63, "t": 198.69, "r": 316.44, "b": 204.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.63, "r_y0": 204.52, "r_x1": 316.44, "r_y1": 204.52, "r_x2": 316.44, "r_y2": 198.69, "r_x3": 312.63, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 316.44, "t": 198.69, "r": 320.26, "b": 204.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.44, "r_y0": 204.52, "r_x1": 320.26, "r_y1": 204.52, "r_x2": 320.26, "r_y2": 198.69, "r_x3": 316.44, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 313.15, "t": 168.1, "r": 316.97, "b": 173.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.15, "r_y0": 173.93, "r_x1": 316.97, "r_y1": 173.93, "r_x2": 316.97, "r_y2": 168.1, "r_x3": 313.15, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 316.96, "t": 168.1, "r": 320.78, "b": 173.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96, "r_y0": 173.93, "r_x1": 320.78, "r_y1": 173.93, "r_x2": 320.78, "r_y2": 168.1, "r_x3": 316.96, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 312.93, "t": 136.59, "r": 316.75, "b": 142.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.93, "r_y0": 142.42, "r_x1": 316.75, "r_y1": 142.42, "r_x2": 316.75, "r_y2": 136.59, "r_x3": 312.93, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 316.74, "t": 136.59, "r": 320.56, "b": 142.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74, "r_y0": 142.42, "r_x1": 320.56, "r_y1": 142.42, "r_x2": 320.56, "r_y2": 136.59, "r_x3": 316.74, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 312.48, "t": 105.6, "r": 316.3, "b": 111.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 111.43, "r_x1": 316.3, "r_y1": 111.43, "r_x2": 316.3, "r_y2": 105.6, "r_x3": 312.48, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 316.3, "t": 105.6, "r": 320.11, "b": 111.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 111.43, "r_x1": 320.11, "r_y1": 111.43, "r_x2": 320.11, "r_y2": 105.6, "r_x3": 316.3, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 312.48, "t": 212.26, "r": 316.3, "b": 218.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 218.09, "r_x1": 316.3, "r_y1": 218.09, "r_x2": 316.3, "r_y2": 212.26, "r_x3": 312.48, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 316.3, "t": 212.26, "r": 320.11, "b": 218.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 218.09, "r_x1": 320.11, "r_y1": 218.09, "r_x2": 320.11, "r_y2": 212.26, "r_x3": 316.3, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 313.08, "t": 183.72, "r": 316.89, "b": 189.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.08, "r_y0": 189.55, "r_x1": 316.89, "r_y1": 189.55, "r_x2": 316.89, "r_y2": 183.72, "r_x3": 313.08, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 316.89, "t": 183.72, "r": 320.71, "b": 189.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89, "r_y0": 189.55, "r_x1": 320.71, "r_y1": 189.55, "r_x2": 320.71, "r_y2": 183.72, "r_x3": 316.89, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 312.76, "t": 152.47, "r": 316.58, "b": 158.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76, "r_y0": 158.31, "r_x1": 316.58, "r_y1": 158.31, "r_x2": 316.58, "r_y2": 152.47, "r_x3": 312.76, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 316.58, "t": 152.47, "r": 320.39, "b": 158.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.58, "r_y0": 158.31, "r_x1": 320.39, "r_y1": 158.31, "r_x2": 320.39, "r_y2": 152.47, "r_x3": 316.58, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 312.2, "t": 120.57, "r": 316.01, "b": 126.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.2, "r_y0": 126.4, "r_x1": 316.01, "r_y1": 126.4, "r_x2": 316.01, "r_y2": 120.57, "r_x3": 312.2, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 316.01, "t": 120.57, "r": 319.83, "b": 126.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01, "r_y0": 126.4, "r_x1": 319.83, "r_y1": 126.4, "r_x2": 319.83, "r_y2": 120.57, "r_x3": 316.01, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 312.82, "t": 90.11, "r": 316.63, "b": 95.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 95.94, "r_x1": 316.63, "r_y1": 95.94, "r_x2": 316.63, "r_y2": 90.11, "r_x3": 312.82, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 316.63, "t": 90.11, "r": 320.45, "b": 95.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63, "r_y0": 95.94, "r_x1": 320.45, "r_y1": 95.94, "r_x2": 320.45, "r_y2": 90.11, "r_x3": 316.63, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 532.17, "t": 222.73, "r": 536.94, "b": 230.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17, "r_y0": 230.02, "r_x1": 536.94, "r_y1": 230.02, "r_x2": 536.94, "r_y2": 222.73, "r_x3": 532.17, "r_y3": 222.73, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 532.88, "t": 108.27, "r": 547.61, "b": 115.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.88, "r_y0": 115.56, "r_x1": 547.61, "r_y1": 115.56, "r_x2": 547.61, "r_y2": 108.27, "r_x3": 532.88, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 532.77, "t": 130.78, "r": 542.74, "b": 138.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.77, "r_y0": 138.07, "r_x1": 542.74, "r_y1": 138.07, "r_x2": 542.74, "r_y2": 130.78, "r_x3": 532.77, "r_y3": 130.78, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 532.8, "t": 153.92, "r": 542.76, "b": 161.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.8, "r_y0": 161.21, "r_x1": 542.76, "r_y1": 161.21, "r_x2": 542.76, "r_y2": 153.92, "r_x3": 532.8, "r_y3": 153.92, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 532.57, "t": 176.76, "r": 542.54, "b": 184.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.57, "r_y0": 184.05, "r_x1": 542.54, "r_y1": 184.05, "r_x2": 542.54, "r_y2": 176.76, "r_x3": 532.57, "r_y3": 176.76, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 532.15, "t": 199.65, "r": 542.11, "b": 206.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.15, "r_y0": 206.94, "r_x1": 542.11, "r_y1": 206.94, "r_x2": 542.11, "r_y2": 199.65, "r_x3": 532.15, "r_y3": 199.65, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 7, "label": "caption", "bbox": { "l": 308.86, "t": 267.84, "r": 545.12, "b": 288.7, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 276.74, "r_x1": 346.06, "r_y1": 276.74, "r_x2": 346.06, "r_y2": 267.84, "r_x3": 308.86, "r_y3": 267.84, "coord_origin": "TOPLEFT" }, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.49, "r_y0": 276.74, "r_x1": 545.12, "r_y1": 276.74, "r_x2": 545.12, "r_y2": 267.84, "r_x3": 354.49, "r_y3": 267.84, "coord_origin": "TOPLEFT" }, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 288.7, "r_x1": 498.57, "r_y1": 288.7, "r_x2": 498.57, "r_y2": 279.79, "r_x3": 308.86, "r_y3": 279.79, "coord_origin": "TOPLEFT" }, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 308.86, "t": 317.47, "r": 437.27, "b": 326.38, "coord_origin": "TOPLEFT" }, "confidence": 0.888, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 326.38, "r_x1": 437.27, "r_y1": 326.38, "r_x2": 437.27, "r_y2": 317.47, "r_x3": 308.86, "r_y3": 317.47, "coord_origin": "TOPLEFT" }, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 331.53, "r": 545.12, "b": 627.36, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 340.44, "r_x1": 545.12, "r_y1": 340.44, "r_x2": 545.12, "r_y2": 331.53, "r_x3": 320.82, "r_y3": 331.53, "coord_origin": "TOPLEFT" }, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 352.39, "r_x1": 545.12, "r_y1": 352.39, "r_x2": 545.12, "r_y2": 343.49, "r_x3": 308.86, "r_y3": 343.49, "coord_origin": "TOPLEFT" }, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 364.35, "r_x1": 545.12, "r_y1": 364.35, "r_x2": 545.12, "r_y2": 355.44, "r_x3": 308.86, "r_y3": 355.44, "coord_origin": "TOPLEFT" }, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 376.3, "r_x1": 545.12, "r_y1": 376.3, "r_x2": 545.12, "r_y2": 367.4, "r_x3": 308.86, "r_y3": 367.4, "coord_origin": "TOPLEFT" }, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 388.26, "r_x1": 545.12, "r_y1": 388.26, "r_x2": 545.12, "r_y2": 379.35, "r_x3": 308.86, "r_y3": 379.35, "coord_origin": "TOPLEFT" }, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.21, "r_x1": 545.12, "r_y1": 400.21, "r_x2": 545.12, "r_y2": 391.31, "r_x3": 308.86, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "a table is characterized as \u201csimple\u201d when it does not contain", "orig": "a table is characterized as \u201csimple\u201d when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.17, "r_x1": 545.12, "r_y1": 412.17, "r_x2": 545.12, "r_y2": 403.26, "r_x3": 308.86, "r_y3": 403.26, "coord_origin": "TOPLEFT" }, "text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.12, "r_x1": 545.12, "r_y1": 424.12, "r_x2": 545.12, "r_y2": 415.22, "r_x3": 308.86, "r_y3": 415.22, "coord_origin": "TOPLEFT" }, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.08, "r_x1": 545.12, "r_y1": 436.08, "r_x2": 545.12, "r_y2": 427.17, "r_x3": 308.86, "r_y3": 427.17, "coord_origin": "TOPLEFT" }, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.03, "r_x1": 545.12, "r_y1": 448.03, "r_x2": 545.12, "r_y2": 439.13, "r_x3": 308.86, "r_y3": 439.13, "coord_origin": "TOPLEFT" }, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 459.99, "r_x1": 545.12, "r_y1": 459.99, "r_x2": 545.12, "r_y2": 451.08, "r_x3": 308.86, "r_y3": 451.08, "coord_origin": "TOPLEFT" }, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 471.94, "r_x1": 545.12, "r_y1": 471.94, "r_x2": 545.12, "r_y2": 463.04, "r_x3": 308.86, "r_y3": 463.04, "coord_origin": "TOPLEFT" }, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 483.9, "r_x1": 545.12, "r_y1": 483.9, "r_x2": 545.12, "r_y2": 474.99, "r_x3": 308.86, "r_y3": 474.99, "coord_origin": "TOPLEFT" }, "text": "text content. Similarly to the PubTabNet, the annotations", "orig": "text content. Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 495.86, "r_x1": 545.12, "r_y1": 495.86, "r_x2": 545.12, "r_y2": 486.95, "r_x3": 308.86, "r_y3": 486.95, "coord_origin": "TOPLEFT" }, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 507.81, "r_x1": 545.12, "r_y1": 507.81, "r_x2": 545.12, "r_y2": 498.9, "r_x3": 308.86, "r_y3": 498.9, "coord_origin": "TOPLEFT" }, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 519.77, "r_x1": 545.12, "r_y1": 519.77, "r_x2": 545.12, "r_y2": 510.86, "r_x3": 308.86, "r_y3": 510.86, "coord_origin": "TOPLEFT" }, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 531.72, "r_x1": 545.12, "r_y1": 531.72, "r_x2": 545.12, "r_y2": 522.81, "r_x3": 308.86, "r_y3": 522.81, "coord_origin": "TOPLEFT" }, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 543.68, "r_x1": 545.12, "r_y1": 543.68, "r_x2": 545.12, "r_y2": 534.77, "r_x3": 308.86, "r_y3": 534.77, "coord_origin": "TOPLEFT" }, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 555.63, "r_x1": 545.12, "r_y1": 555.63, "r_x2": 545.12, "r_y2": 546.72, "r_x3": 308.86, "r_y3": 546.72, "coord_origin": "TOPLEFT" }, "text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 567.59, "r_x1": 545.12, "r_y1": 567.59, "r_x2": 545.12, "r_y2": 558.68, "r_x3": 308.86, "r_y3": 558.68, "coord_origin": "TOPLEFT" }, "text": "47% complex). Finally the TableBank dataset consists of", "orig": "47% complex). Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 579.54, "r_x1": 545.12, "r_y1": 579.54, "r_x2": 545.12, "r_y2": 570.64, "r_x3": 308.86, "r_y3": 570.64, "coord_origin": "TOPLEFT" }, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 591.5, "r_x1": 545.11, "r_y1": 591.5, "r_x2": 545.11, "r_y2": 582.59, "r_x3": 308.86, "r_y3": 582.59, "coord_origin": "TOPLEFT" }, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 603.45, "r_x1": 545.12, "r_y1": 603.45, "r_x2": 545.12, "r_y2": 594.55, "r_x3": 308.86, "r_y3": 594.55, "coord_origin": "TOPLEFT" }, "text": "boxes of the table cells. The entire dataset consists of sim-", "orig": "boxes of the table cells. The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 615.41, "r_x1": 545.12, "r_y1": 615.41, "r_x2": 545.12, "r_y2": 606.5, "r_x3": 308.86, "r_y3": 606.5, "coord_origin": "TOPLEFT" }, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 627.36, "r_x1": 348.16, "r_y1": 627.36, "r_x2": 348.16, "r_y2": 618.46, "r_x3": 308.86, "r_y3": 618.46, "coord_origin": "TOPLEFT" }, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 632.51, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 641.42, "r_x1": 545.11, "r_y1": 641.42, "r_x2": 545.11, "r_y2": 632.51, "r_x3": 320.82, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.38, "r_x1": 545.12, "r_y1": 653.38, "r_x2": 545.12, "r_y2": 644.47, "r_x3": 308.86, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.33, "r_x1": 545.12, "r_y1": 665.33, "r_x2": 545.12, "r_y2": 656.42, "r_x3": 308.86, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "cal purposes. Given the size of PubTabNet, we adopted its", "orig": "cal purposes. Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "as PNG images with a resolution of 72 dpi. Additionally,", "orig": "as PNG images with a resolution of 72 dpi. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 10, "page_no": 2, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 250.15, "b": 84.11, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 250.15, "r_y1": 84.11, "r_x2": 250.15, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "tag-decoder which is constrained to the table-tags." }, { "label": "text", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 87.22, "r": 286.37, "b": 275.45, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 96.13, "r_x1": 70.37, "r_y1": 96.13, "r_x2": 70.37, "r_y2": 87.22, "r_x3": 62.07, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.93, "r_y0": 96.13, "r_x1": 110.95, "r_y1": 96.13, "r_x2": 110.95, "r_y2": 87.22, "r_x3": 76.93, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.54, "r_y0": 96.13, "r_x1": 136.26, "r_y1": 96.13, "r_x2": 136.26, "r_y2": 87.22, "r_x3": 118.54, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.82, "r_y0": 96.13, "r_x1": 175.37, "r_y1": 96.13, "r_x2": 175.37, "r_y2": 87.22, "r_x3": 142.82, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.95, "r_y0": 96.13, "r_x1": 232.84, "r_y1": 96.13, "r_x2": 232.84, "r_y2": 87.22, "r_x3": 181.95, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.41, "r_y0": 96.13, "r_x1": 265.41, "r_y1": 96.13, "r_x2": 265.41, "r_y2": 87.22, "r_x3": 239.41, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.98, "r_y0": 96.13, "r_x1": 286.36, "r_y1": 96.13, "r_x2": 286.36, "r_y2": 87.22, "r_x3": 271.98, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.08, "r_x1": 286.37, "r_y1": 108.08, "r_x2": 286.37, "r_y2": 99.17, "r_x3": 50.11, "r_y3": 99.17, "coord_origin": "TOPLEFT" }, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 120.04, "r_x1": 286.37, "r_y1": 120.04, "r_x2": 286.37, "r_y2": 111.13, "r_x3": 50.11, "r_y3": 111.13, "coord_origin": "TOPLEFT" }, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.99, "r_x1": 286.37, "r_y1": 131.99, "r_x2": 286.37, "r_y2": 123.09, "r_x3": 50.11, "r_y3": 123.09, "coord_origin": "TOPLEFT" }, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 143.95, "r_x1": 286.37, "r_y1": 143.95, "r_x2": 286.37, "r_y2": 135.04, "r_x3": 50.11, "r_y3": 135.04, "coord_origin": "TOPLEFT" }, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 155.9, "r_x1": 286.37, "r_y1": 155.9, "r_x2": 286.37, "r_y2": 147.0, "r_x3": 50.11, "r_y3": 147.0, "coord_origin": "TOPLEFT" }, "text": "bedded in the content-decoder. This reliance on a custom,", "orig": "bedded in the content-decoder. This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 167.86, "r_x1": 286.37, "r_y1": 167.86, "r_x2": 286.37, "r_y2": 158.95, "r_x3": 50.11, "r_y3": 158.95, "coord_origin": "TOPLEFT" }, "text": "implicit OCR decoder is of course problematic. OCR is a", "orig": "implicit OCR decoder is of course problematic. OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 179.81, "r_x1": 286.37, "r_y1": 179.81, "r_x2": 286.37, "r_y2": 170.91, "r_x3": 50.11, "r_y3": 170.91, "coord_origin": "TOPLEFT" }, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 191.77, "r_x1": 286.37, "r_y1": 191.77, "r_x2": 286.37, "r_y2": 182.86, "r_x3": 50.11, "r_y3": 182.86, "coord_origin": "TOPLEFT" }, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 203.72, "r_x1": 286.37, "r_y1": 203.72, "r_x2": 286.37, "r_y2": 194.82, "r_x3": 50.11, "r_y3": 194.82, "coord_origin": "TOPLEFT" }, "text": "limited availability for non-english content in the current", "orig": "limited availability for non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 215.68, "r_x1": 286.37, "r_y1": 215.68, "r_x2": 286.37, "r_y2": 206.77, "r_x3": 50.11, "r_y3": 206.77, "coord_origin": "TOPLEFT" }, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 227.63, "r_x1": 286.37, "r_y1": 227.63, "r_x2": 286.37, "r_y2": 218.73, "r_x3": 50.11, "r_y3": 218.73, "coord_origin": "TOPLEFT" }, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 239.59, "r_x1": 286.37, "r_y1": 239.59, "r_x2": 286.37, "r_y2": 230.68, "r_x3": 50.11, "r_y3": 230.68, "coord_origin": "TOPLEFT" }, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 251.54, "r_x1": 286.37, "r_y1": 251.54, "r_x2": 286.37, "r_y2": 242.64, "r_x3": 50.11, "r_y3": 242.64, "coord_origin": "TOPLEFT" }, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 263.5, "r_x1": 286.37, "r_y1": 263.5, "r_x2": 286.37, "r_y2": 254.59, "r_x3": 50.11, "r_y3": 254.59, "coord_origin": "TOPLEFT" }, "text": "cell. The latter was the inspiration for the work of this pa-", "orig": "cell. The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 275.45, "r_x1": 64.78, "r_y1": 275.45, "r_x2": 64.78, "r_y2": 266.55, "r_x3": 50.11, "r_y3": 266.55, "coord_origin": "TOPLEFT" }, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-characterrecognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 278.44, "r": 286.37, "b": 490.7, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 287.4, "r_x1": 171.57, "r_y1": 287.4, "r_x2": 171.57, "r_y2": 278.44, "r_x3": 62.07, "r_y3": 278.44, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.57, "r_y0": 287.47, "r_x1": 174.34, "r_y1": 287.47, "r_x2": 174.34, "r_y2": 278.56, "r_x3": 171.57, "r_y3": 278.56, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.19, "r_y0": 287.47, "r_x1": 286.36, "r_y1": 287.47, "r_x2": 286.36, "r_y2": 278.56, "r_x3": 185.19, "r_y3": 278.56, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 299.42, "r_x1": 286.37, "r_y1": 299.42, "r_x2": 286.37, "r_y2": 290.51, "r_x3": 50.11, "r_y3": 290.51, "coord_origin": "TOPLEFT" }, "text": "(GNN\u2019s) take a radically different approach to table-", "orig": "(GNN\u2019s) take a radically different approach to table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 311.38, "r_x1": 131.17, "r_y1": 311.38, "r_x2": 131.17, "r_y2": 302.47, "r_x3": 50.11, "r_y3": 302.47, "coord_origin": "TOPLEFT" }, "text": "structure extraction.", "orig": "structure extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.85, "r_y0": 311.38, "r_x1": 286.37, "r_y1": 311.38, "r_x2": 286.37, "r_y2": 302.47, "r_x3": 138.85, "r_y3": 302.47, "coord_origin": "TOPLEFT" }, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 323.33, "r_x1": 286.37, "r_y1": 323.33, "r_x2": 286.37, "r_y2": 314.42, "r_x3": 50.11, "r_y3": 314.42, "coord_origin": "TOPLEFT" }, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 335.29, "r_x1": 286.37, "r_y1": 335.29, "r_x2": 286.37, "r_y2": 326.38, "r_x3": 50.11, "r_y3": 326.38, "coord_origin": "TOPLEFT" }, "text": "one creates an initial graph, where each of the text-cells", "orig": "one creates an initial graph, where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 347.24, "r_x1": 286.37, "r_y1": 347.24, "r_x2": 286.37, "r_y2": 338.33, "r_x3": 50.11, "r_y3": 338.33, "coord_origin": "TOPLEFT" }, "text": "becomes a node in the graph similar to [33, 34, 2]. Each", "orig": "becomes a node in the graph similar to [33, 34, 2]. Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.2, "r_x1": 286.37, "r_y1": 359.2, "r_x2": 286.37, "r_y2": 350.29, "r_x3": 50.11, "r_y3": 350.29, "coord_origin": "TOPLEFT" }, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.15, "r_x1": 286.37, "r_y1": 371.15, "r_x2": 286.37, "r_y2": 362.25, "r_x3": 50.11, "r_y3": 362.25, "coord_origin": "TOPLEFT" }, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 383.11, "r_x1": 286.37, "r_y1": 383.11, "r_x2": 286.37, "r_y2": 374.2, "r_x3": 50.11, "r_y3": 374.2, "coord_origin": "TOPLEFT" }, "text": "text. Furthermore, nodes that represent adjacent text-cells", "orig": "text. Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 395.06, "r_x1": 286.37, "r_y1": 395.06, "r_x2": 286.37, "r_y2": 386.16, "r_x3": 50.11, "r_y3": 386.16, "coord_origin": "TOPLEFT" }, "text": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 407.02, "r_x1": 286.37, "r_y1": 407.02, "r_x2": 286.37, "r_y2": 398.11, "r_x3": 50.11, "r_y3": 398.11, "coord_origin": "TOPLEFT" }, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 418.97, "r_x1": 286.37, "r_y1": 418.97, "r_x2": 286.37, "r_y2": 410.07, "r_x3": 50.11, "r_y3": 410.07, "coord_origin": "TOPLEFT" }, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 430.93, "r_x1": 286.37, "r_y1": 430.93, "r_x2": 286.37, "r_y2": 422.02, "r_x3": 50.11, "r_y3": 422.02, "coord_origin": "TOPLEFT" }, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 442.88, "r_x1": 198.24, "r_y1": 442.88, "r_x2": 198.24, "r_y2": 433.98, "r_x3": 50.11, "r_y3": 433.98, "coord_origin": "TOPLEFT" }, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.93, "r_y0": 442.88, "r_x1": 286.37, "r_y1": 442.88, "r_x2": 286.37, "r_y2": 433.98, "r_x3": 205.93, "r_y3": 433.98, "coord_origin": "TOPLEFT" }, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 454.84, "r_x1": 286.37, "r_y1": 454.84, "r_x2": 286.37, "r_y2": 445.93, "r_x3": 50.11, "r_y3": 445.93, "coord_origin": "TOPLEFT" }, "text": "represent the table-structure. With this approach, one can", "orig": "represent the table-structure. With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 466.79, "r_x1": 286.37, "r_y1": 466.79, "r_x2": 286.37, "r_y2": 457.89, "r_x3": 50.11, "r_y3": 457.89, "coord_origin": "TOPLEFT" }, "text": "avoid the need to build custom OCR decoders. However,", "orig": "avoid the need to build custom OCR decoders. However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 478.75, "r_x1": 286.37, "r_y1": 478.75, "r_x2": 286.37, "r_y2": 469.84, "r_x3": 50.11, "r_y3": 469.84, "coord_origin": "TOPLEFT" }, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 490.7, "r_x1": 186.5, "r_y1": 490.7, "r_x2": 186.5, "r_y2": 481.8, "r_x3": 50.11, "r_y3": 481.8, "coord_origin": "TOPLEFT" }, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to tablestructure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 493.69, "r": 286.37, "b": 622.27, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 502.65, "r_x1": 252.88, "r_y1": 502.65, "r_x2": 252.88, "r_y2": 493.69, "r_x3": 62.07, "r_y3": 493.69, "coord_origin": "TOPLEFT" }, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.88, "r_y0": 502.71, "r_x1": 286.37, "r_y1": 502.71, "r_x2": 286.37, "r_y2": 493.81, "r_x3": 252.88, "r_y3": 493.81, "coord_origin": "TOPLEFT" }, "text": ": A pop-", "orig": ": A pop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 514.67, "r_x1": 286.37, "r_y1": 514.67, "r_x2": 286.37, "r_y2": 505.76, "r_x3": 50.11, "r_y3": 505.76, "coord_origin": "TOPLEFT" }, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 526.62, "r_x1": 286.37, "r_y1": 526.62, "r_x2": 286.37, "r_y2": 517.72, "r_x3": 50.11, "r_y3": 517.72, "coord_origin": "TOPLEFT" }, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 538.58, "r_x1": 286.37, "r_y1": 538.58, "r_x2": 286.37, "r_y2": 529.67, "r_x3": 50.11, "r_y3": 529.67, "coord_origin": "TOPLEFT" }, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 550.54, "r_x1": 286.37, "r_y1": 550.54, "r_x2": 286.37, "r_y2": 541.63, "r_x3": 50.11, "r_y3": 541.63, "coord_origin": "TOPLEFT" }, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 562.49, "r_x1": 286.37, "r_y1": 562.49, "r_x2": 286.37, "r_y2": 553.58, "r_x3": 50.11, "r_y3": 553.58, "coord_origin": "TOPLEFT" }, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 574.45, "r_x1": 286.37, "r_y1": 574.45, "r_x2": 286.37, "r_y2": 565.54, "r_x3": 50.11, "r_y3": 565.54, "coord_origin": "TOPLEFT" }, "text": "its images) and finally uses different rule-sets to obtain", "orig": "its images) and finally uses different rule-sets to obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 586.4, "r_x1": 286.37, "r_y1": 586.4, "r_x2": 286.37, "r_y2": 577.49, "r_x3": 50.11, "r_y3": 577.49, "coord_origin": "TOPLEFT" }, "text": "its table-structure. Currently, this approach achieves state-", "orig": "its table-structure. Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 598.36, "r_x1": 286.37, "r_y1": 598.36, "r_x2": 286.37, "r_y2": 589.45, "r_x3": 50.11, "r_y3": 589.45, "coord_origin": "TOPLEFT" }, "text": "of-the-art results, but is not an end-to-end deep-learning", "orig": "of-the-art results, but is not an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 610.31, "r_x1": 286.37, "r_y1": 610.31, "r_x2": 286.37, "r_y2": 601.4, "r_x3": 50.11, "r_y3": 601.4, "coord_origin": "TOPLEFT" }, "text": "method. As such, new rules need to be written if different", "orig": "method. As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 622.27, "r_x1": 175.99, "r_y1": 622.27, "r_x2": 175.99, "r_y2": 613.36, "r_x3": 50.11, "r_y3": 613.36, "coord_origin": "TOPLEFT" }, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Hybrid Deep Learning-Rule-Based approach : A popular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or MaskRCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves stateof-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered." }, { "label": "section_header", "id": 8, "page_no": 2, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 50.11, "t": 635.94, "r": 105.23, "b": 646.69, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 646.69, "r_x1": 57.82, "r_y1": 646.69, "r_x2": 57.82, "r_y2": 635.94, "r_x3": 50.11, "r_y3": 635.94, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.11, "r_y0": 646.69, "r_x1": 105.23, "r_y1": 646.69, "r_x2": 105.23, "r_y2": 635.94, "r_x3": 68.11, "r_y3": 635.94, "coord_origin": "TOPLEFT" }, "text": "Datasets", "orig": "Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Datasets" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 656.43, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 665.33, "r_x1": 286.36, "r_y1": 665.33, "r_x2": 286.36, "r_y2": 656.43, "r_x3": 62.07, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "evaluate our models. These datasets span over various ap-", "orig": "evaluate our models. These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 166.25, "r_y1": 701.2, "r_x2": 166.25, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.69, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 173.69, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-" }, { "label": "picture", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 312.1, "t": 78.44, "r": 550.39, "b": 250.61, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.8, "r_y0": 88.56, "r_x1": 486.85, "r_y1": 88.56, "r_x2": 486.85, "r_y2": 79.81, "r_x3": 380.8, "r_y3": 79.81, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.77, "r_y0": 250.77, "r_x1": 469.79, "r_y1": 250.77, "r_x2": 469.79, "r_y2": 242.03, "r_x3": 396.77, "r_y3": 242.03, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.98, "r_y0": 239.25, "r_x1": 324.79, "r_y1": 239.25, "r_x2": 324.79, "r_y2": 233.42, "r_x3": 320.98, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.48, "r_y0": 239.25, "r_x1": 418.11, "r_y1": 239.25, "r_x2": 418.11, "r_y2": 233.42, "r_x3": 410.48, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.85, "r_y0": 239.25, "r_x1": 508.48, "r_y1": 239.25, "r_x2": 508.48, "r_y2": 233.42, "r_x3": 500.85, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.3, "r_y0": 239.25, "r_x1": 372.93, "r_y1": 239.25, "r_x2": 372.93, "r_y2": 233.42, "r_x3": 365.3, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.67, "r_y0": 239.25, "r_x1": 463.3, "r_y1": 239.25, "r_x2": 463.3, "r_y2": 233.42, "r_x3": 455.67, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.04, "r_y0": 239.25, "r_x1": 549.67, "r_y1": 239.25, "r_x2": 549.67, "r_y2": 233.42, "r_x3": 542.04, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04, "r_y0": 236.28, "r_x1": 319.86, "r_y1": 236.28, "r_x2": 319.86, "r_y2": 230.45, "r_x3": 316.04, "r_y3": 230.45, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.63, "r_y0": 204.52, "r_x1": 316.44, "r_y1": 204.52, "r_x2": 316.44, "r_y2": 198.69, "r_x3": 312.63, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.44, "r_y0": 204.52, "r_x1": 320.26, "r_y1": 204.52, "r_x2": 320.26, "r_y2": 198.69, "r_x3": 316.44, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.15, "r_y0": 173.93, "r_x1": 316.97, "r_y1": 173.93, "r_x2": 316.97, "r_y2": 168.1, "r_x3": 313.15, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96, "r_y0": 173.93, "r_x1": 320.78, "r_y1": 173.93, "r_x2": 320.78, "r_y2": 168.1, "r_x3": 316.96, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.93, "r_y0": 142.42, "r_x1": 316.75, "r_y1": 142.42, "r_x2": 316.75, "r_y2": 136.59, "r_x3": 312.93, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74, "r_y0": 142.42, "r_x1": 320.56, "r_y1": 142.42, "r_x2": 320.56, "r_y2": 136.59, "r_x3": 316.74, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 111.43, "r_x1": 316.3, "r_y1": 111.43, "r_x2": 316.3, "r_y2": 105.6, "r_x3": 312.48, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 111.43, "r_x1": 320.11, "r_y1": 111.43, "r_x2": 320.11, "r_y2": 105.6, "r_x3": 316.3, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 218.09, "r_x1": 316.3, "r_y1": 218.09, "r_x2": 316.3, "r_y2": 212.26, "r_x3": 312.48, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 218.09, "r_x1": 320.11, "r_y1": 218.09, "r_x2": 320.11, "r_y2": 212.26, "r_x3": 316.3, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.08, "r_y0": 189.55, "r_x1": 316.89, "r_y1": 189.55, "r_x2": 316.89, "r_y2": 183.72, "r_x3": 313.08, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89, "r_y0": 189.55, "r_x1": 320.71, "r_y1": 189.55, "r_x2": 320.71, "r_y2": 183.72, "r_x3": 316.89, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76, "r_y0": 158.31, "r_x1": 316.58, "r_y1": 158.31, "r_x2": 316.58, "r_y2": 152.47, "r_x3": 312.76, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.58, "r_y0": 158.31, "r_x1": 320.39, "r_y1": 158.31, "r_x2": 320.39, "r_y2": 152.47, "r_x3": 316.58, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.2, "r_y0": 126.4, "r_x1": 316.01, "r_y1": 126.4, "r_x2": 316.01, "r_y2": 120.57, "r_x3": 312.2, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01, "r_y0": 126.4, "r_x1": 319.83, "r_y1": 126.4, "r_x2": 319.83, "r_y2": 120.57, "r_x3": 316.01, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 95.94, "r_x1": 316.63, "r_y1": 95.94, "r_x2": 316.63, "r_y2": 90.11, "r_x3": 312.82, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63, "r_y0": 95.94, "r_x1": 320.45, "r_y1": 95.94, "r_x2": 320.45, "r_y2": 90.11, "r_x3": 316.63, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17, "r_y0": 230.02, "r_x1": 536.94, "r_y1": 230.02, "r_x2": 536.94, "r_y2": 222.73, "r_x3": 532.17, "r_y3": 222.73, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.88, "r_y0": 115.56, "r_x1": 547.61, "r_y1": 115.56, "r_x2": 547.61, "r_y2": 108.27, "r_x3": 532.88, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.77, "r_y0": 138.07, "r_x1": 542.74, "r_y1": 138.07, "r_x2": 542.74, "r_y2": 130.78, "r_x3": 532.77, "r_y3": 130.78, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.8, "r_y0": 161.21, "r_x1": 542.76, "r_y1": 161.21, "r_x2": 542.76, "r_y2": 153.92, "r_x3": 532.8, "r_y3": 153.92, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.57, "r_y0": 184.05, "r_x1": 542.54, "r_y1": 184.05, "r_x2": 542.54, "r_y2": 176.76, "r_x3": 532.57, "r_y3": 176.76, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.15, "r_y0": 206.94, "r_x1": 542.11, "r_y1": 206.94, "r_x2": 542.11, "r_y2": 199.65, "r_x3": 532.15, "r_y3": 199.65, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 12, "label": "section_header", "bbox": { "l": 380.8, "t": 79.81, "r": 486.85, "b": 88.56, "coord_origin": "TOPLEFT" }, "confidence": 0.569, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.8, "r_y0": 88.56, "r_x1": 486.85, "r_y1": 88.56, "r_x2": 486.85, "r_y2": 79.81, "r_x3": 380.8, "r_y3": 79.81, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 396.77, "t": 242.03, "r": 469.79, "b": 250.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.77, "r_y0": 250.77, "r_x1": 469.79, "r_y1": 250.77, "r_x2": 469.79, "r_y2": 242.03, "r_x3": 396.77, "r_y3": 242.03, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 320.98, "t": 233.42, "r": 324.79, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.98, "r_y0": 239.25, "r_x1": 324.79, "r_y1": 239.25, "r_x2": 324.79, "r_y2": 233.42, "r_x3": 320.98, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 410.48, "t": 233.42, "r": 418.11, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.48, "r_y0": 239.25, "r_x1": 418.11, "r_y1": 239.25, "r_x2": 418.11, "r_y2": 233.42, "r_x3": 410.48, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 500.85, "t": 233.42, "r": 508.48, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.85, "r_y0": 239.25, "r_x1": 508.48, "r_y1": 239.25, "r_x2": 508.48, "r_y2": 233.42, "r_x3": 500.85, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 365.3, "t": 233.42, "r": 372.93, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.3, "r_y0": 239.25, "r_x1": 372.93, "r_y1": 239.25, "r_x2": 372.93, "r_y2": 233.42, "r_x3": 365.3, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 455.67, "t": 233.42, "r": 463.3, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.67, "r_y0": 239.25, "r_x1": 463.3, "r_y1": 239.25, "r_x2": 463.3, "r_y2": 233.42, "r_x3": 455.67, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 542.04, "t": 233.42, "r": 549.67, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.04, "r_y0": 239.25, "r_x1": 549.67, "r_y1": 239.25, "r_x2": 549.67, "r_y2": 233.42, "r_x3": 542.04, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 316.04, "t": 230.45, "r": 319.86, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04, "r_y0": 236.28, "r_x1": 319.86, "r_y1": 236.28, "r_x2": 319.86, "r_y2": 230.45, "r_x3": 316.04, "r_y3": 230.45, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 312.63, "t": 198.69, "r": 316.44, "b": 204.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.63, "r_y0": 204.52, "r_x1": 316.44, "r_y1": 204.52, "r_x2": 316.44, "r_y2": 198.69, "r_x3": 312.63, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 316.44, "t": 198.69, "r": 320.26, "b": 204.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.44, "r_y0": 204.52, "r_x1": 320.26, "r_y1": 204.52, "r_x2": 320.26, "r_y2": 198.69, "r_x3": 316.44, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 313.15, "t": 168.1, "r": 316.97, "b": 173.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.15, "r_y0": 173.93, "r_x1": 316.97, "r_y1": 173.93, "r_x2": 316.97, "r_y2": 168.1, "r_x3": 313.15, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 316.96, "t": 168.1, "r": 320.78, "b": 173.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96, "r_y0": 173.93, "r_x1": 320.78, "r_y1": 173.93, "r_x2": 320.78, "r_y2": 168.1, "r_x3": 316.96, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 312.93, "t": 136.59, "r": 316.75, "b": 142.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.93, "r_y0": 142.42, "r_x1": 316.75, "r_y1": 142.42, "r_x2": 316.75, "r_y2": 136.59, "r_x3": 312.93, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 316.74, "t": 136.59, "r": 320.56, "b": 142.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74, "r_y0": 142.42, "r_x1": 320.56, "r_y1": 142.42, "r_x2": 320.56, "r_y2": 136.59, "r_x3": 316.74, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 312.48, "t": 105.6, "r": 316.3, "b": 111.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 111.43, "r_x1": 316.3, "r_y1": 111.43, "r_x2": 316.3, "r_y2": 105.6, "r_x3": 312.48, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 316.3, "t": 105.6, "r": 320.11, "b": 111.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 111.43, "r_x1": 320.11, "r_y1": 111.43, "r_x2": 320.11, "r_y2": 105.6, "r_x3": 316.3, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 312.48, "t": 212.26, "r": 316.3, "b": 218.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 218.09, "r_x1": 316.3, "r_y1": 218.09, "r_x2": 316.3, "r_y2": 212.26, "r_x3": 312.48, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 316.3, "t": 212.26, "r": 320.11, "b": 218.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 218.09, "r_x1": 320.11, "r_y1": 218.09, "r_x2": 320.11, "r_y2": 212.26, "r_x3": 316.3, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 313.08, "t": 183.72, "r": 316.89, "b": 189.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.08, "r_y0": 189.55, "r_x1": 316.89, "r_y1": 189.55, "r_x2": 316.89, "r_y2": 183.72, "r_x3": 313.08, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 316.89, "t": 183.72, "r": 320.71, "b": 189.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89, "r_y0": 189.55, "r_x1": 320.71, "r_y1": 189.55, "r_x2": 320.71, "r_y2": 183.72, "r_x3": 316.89, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 312.76, "t": 152.47, "r": 316.58, "b": 158.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76, "r_y0": 158.31, "r_x1": 316.58, "r_y1": 158.31, "r_x2": 316.58, "r_y2": 152.47, "r_x3": 312.76, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 316.58, "t": 152.47, "r": 320.39, "b": 158.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.58, "r_y0": 158.31, "r_x1": 320.39, "r_y1": 158.31, "r_x2": 320.39, "r_y2": 152.47, "r_x3": 316.58, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 312.2, "t": 120.57, "r": 316.01, "b": 126.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.2, "r_y0": 126.4, "r_x1": 316.01, "r_y1": 126.4, "r_x2": 316.01, "r_y2": 120.57, "r_x3": 312.2, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 316.01, "t": 120.57, "r": 319.83, "b": 126.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01, "r_y0": 126.4, "r_x1": 319.83, "r_y1": 126.4, "r_x2": 319.83, "r_y2": 120.57, "r_x3": 316.01, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 312.82, "t": 90.11, "r": 316.63, "b": 95.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 95.94, "r_x1": 316.63, "r_y1": 95.94, "r_x2": 316.63, "r_y2": 90.11, "r_x3": 312.82, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 316.63, "t": 90.11, "r": 320.45, "b": 95.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63, "r_y0": 95.94, "r_x1": 320.45, "r_y1": 95.94, "r_x2": 320.45, "r_y2": 90.11, "r_x3": 316.63, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 532.17, "t": 222.73, "r": 536.94, "b": 230.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17, "r_y0": 230.02, "r_x1": 536.94, "r_y1": 230.02, "r_x2": 536.94, "r_y2": 222.73, "r_x3": 532.17, "r_y3": 222.73, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 532.88, "t": 108.27, "r": 547.61, "b": 115.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.88, "r_y0": 115.56, "r_x1": 547.61, "r_y1": 115.56, "r_x2": 547.61, "r_y2": 108.27, "r_x3": 532.88, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 532.77, "t": 130.78, "r": 542.74, "b": 138.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.77, "r_y0": 138.07, "r_x1": 542.74, "r_y1": 138.07, "r_x2": 542.74, "r_y2": 130.78, "r_x3": 532.77, "r_y3": 130.78, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 532.8, "t": 153.92, "r": 542.76, "b": 161.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.8, "r_y0": 161.21, "r_x1": 542.76, "r_y1": 161.21, "r_x2": 542.76, "r_y2": 153.92, "r_x3": 532.8, "r_y3": 153.92, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 532.57, "t": 176.76, "r": 542.54, "b": 184.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.57, "r_y0": 184.05, "r_x1": 542.54, "r_y1": 184.05, "r_x2": 542.54, "r_y2": 176.76, "r_x3": 532.57, "r_y3": 176.76, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 532.15, "t": 199.65, "r": 542.11, "b": 206.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.15, "r_y0": 206.94, "r_x1": 542.11, "r_y1": 206.94, "r_x2": 542.11, "r_y2": 199.65, "r_x3": 532.15, "r_y3": 199.65, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 7, "page_no": 2, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 308.86, "t": 267.84, "r": 545.12, "b": 288.7, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 276.74, "r_x1": 346.06, "r_y1": 276.74, "r_x2": 346.06, "r_y2": 267.84, "r_x3": 308.86, "r_y3": 267.84, "coord_origin": "TOPLEFT" }, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.49, "r_y0": 276.74, "r_x1": 545.12, "r_y1": 276.74, "r_x2": 545.12, "r_y2": 267.84, "r_x3": 354.49, "r_y3": 267.84, "coord_origin": "TOPLEFT" }, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 288.7, "r_x1": 498.57, "r_y1": 288.7, "r_x2": 498.57, "r_y2": 279.79, "r_x3": 308.86, "r_y3": 279.79, "coord_origin": "TOPLEFT" }, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets" }, { "label": "text", "id": 9, "page_no": 2, "cluster": { "id": 9, "label": "text", "bbox": { "l": 308.86, "t": 317.47, "r": 437.27, "b": 326.38, "coord_origin": "TOPLEFT" }, "confidence": 0.888, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 326.38, "r_x1": 437.27, "r_y1": 326.38, "r_x2": 437.27, "r_y2": 317.47, "r_x3": 308.86, "r_y3": 317.47, "coord_origin": "TOPLEFT" }, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "balance in the previous datasets." }, { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 331.53, "r": 545.12, "b": 627.36, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 340.44, "r_x1": 545.12, "r_y1": 340.44, "r_x2": 545.12, "r_y2": 331.53, "r_x3": 320.82, "r_y3": 331.53, "coord_origin": "TOPLEFT" }, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 352.39, "r_x1": 545.12, "r_y1": 352.39, "r_x2": 545.12, "r_y2": 343.49, "r_x3": 308.86, "r_y3": 343.49, "coord_origin": "TOPLEFT" }, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 364.35, "r_x1": 545.12, "r_y1": 364.35, "r_x2": 545.12, "r_y2": 355.44, "r_x3": 308.86, "r_y3": 355.44, "coord_origin": "TOPLEFT" }, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 376.3, "r_x1": 545.12, "r_y1": 376.3, "r_x2": 545.12, "r_y2": 367.4, "r_x3": 308.86, "r_y3": 367.4, "coord_origin": "TOPLEFT" }, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 388.26, "r_x1": 545.12, "r_y1": 388.26, "r_x2": 545.12, "r_y2": 379.35, "r_x3": 308.86, "r_y3": 379.35, "coord_origin": "TOPLEFT" }, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.21, "r_x1": 545.12, "r_y1": 400.21, "r_x2": 545.12, "r_y2": 391.31, "r_x3": 308.86, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "a table is characterized as \u201csimple\u201d when it does not contain", "orig": "a table is characterized as \u201csimple\u201d when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.17, "r_x1": 545.12, "r_y1": 412.17, "r_x2": 545.12, "r_y2": 403.26, "r_x3": 308.86, "r_y3": 403.26, "coord_origin": "TOPLEFT" }, "text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.12, "r_x1": 545.12, "r_y1": 424.12, "r_x2": 545.12, "r_y2": 415.22, "r_x3": 308.86, "r_y3": 415.22, "coord_origin": "TOPLEFT" }, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.08, "r_x1": 545.12, "r_y1": 436.08, "r_x2": 545.12, "r_y2": 427.17, "r_x3": 308.86, "r_y3": 427.17, "coord_origin": "TOPLEFT" }, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.03, "r_x1": 545.12, "r_y1": 448.03, "r_x2": 545.12, "r_y2": 439.13, "r_x3": 308.86, "r_y3": 439.13, "coord_origin": "TOPLEFT" }, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 459.99, "r_x1": 545.12, "r_y1": 459.99, "r_x2": 545.12, "r_y2": 451.08, "r_x3": 308.86, "r_y3": 451.08, "coord_origin": "TOPLEFT" }, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 471.94, "r_x1": 545.12, "r_y1": 471.94, "r_x2": 545.12, "r_y2": 463.04, "r_x3": 308.86, "r_y3": 463.04, "coord_origin": "TOPLEFT" }, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 483.9, "r_x1": 545.12, "r_y1": 483.9, "r_x2": 545.12, "r_y2": 474.99, "r_x3": 308.86, "r_y3": 474.99, "coord_origin": "TOPLEFT" }, "text": "text content. Similarly to the PubTabNet, the annotations", "orig": "text content. Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 495.86, "r_x1": 545.12, "r_y1": 495.86, "r_x2": 545.12, "r_y2": 486.95, "r_x3": 308.86, "r_y3": 486.95, "coord_origin": "TOPLEFT" }, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 507.81, "r_x1": 545.12, "r_y1": 507.81, "r_x2": 545.12, "r_y2": 498.9, "r_x3": 308.86, "r_y3": 498.9, "coord_origin": "TOPLEFT" }, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 519.77, "r_x1": 545.12, "r_y1": 519.77, "r_x2": 545.12, "r_y2": 510.86, "r_x3": 308.86, "r_y3": 510.86, "coord_origin": "TOPLEFT" }, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 531.72, "r_x1": 545.12, "r_y1": 531.72, "r_x2": 545.12, "r_y2": 522.81, "r_x3": 308.86, "r_y3": 522.81, "coord_origin": "TOPLEFT" }, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 543.68, "r_x1": 545.12, "r_y1": 543.68, "r_x2": 545.12, "r_y2": 534.77, "r_x3": 308.86, "r_y3": 534.77, "coord_origin": "TOPLEFT" }, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 555.63, "r_x1": 545.12, "r_y1": 555.63, "r_x2": 545.12, "r_y2": 546.72, "r_x3": 308.86, "r_y3": 546.72, "coord_origin": "TOPLEFT" }, "text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 567.59, "r_x1": 545.12, "r_y1": 567.59, "r_x2": 545.12, "r_y2": 558.68, "r_x3": 308.86, "r_y3": 558.68, "coord_origin": "TOPLEFT" }, "text": "47% complex). Finally the TableBank dataset consists of", "orig": "47% complex). Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 579.54, "r_x1": 545.12, "r_y1": 579.54, "r_x2": 545.12, "r_y2": 570.64, "r_x3": 308.86, "r_y3": 570.64, "coord_origin": "TOPLEFT" }, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 591.5, "r_x1": 545.11, "r_y1": 591.5, "r_x2": 545.11, "r_y2": 582.59, "r_x3": 308.86, "r_y3": 582.59, "coord_origin": "TOPLEFT" }, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 603.45, "r_x1": 545.12, "r_y1": 603.45, "r_x2": 545.12, "r_y2": 594.55, "r_x3": 308.86, "r_y3": 594.55, "coord_origin": "TOPLEFT" }, "text": "boxes of the table cells. The entire dataset consists of sim-", "orig": "boxes of the table cells. The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 615.41, "r_x1": 545.12, "r_y1": 615.41, "r_x2": 545.12, "r_y2": 606.5, "r_x3": 308.86, "r_y3": 606.5, "coord_origin": "TOPLEFT" }, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 627.36, "r_x1": 348.16, "r_y1": 627.36, "r_x2": 348.16, "r_y2": 618.46, "r_x3": 308.86, "r_y3": 618.46, "coord_origin": "TOPLEFT" }, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The PubTabNet dataset contains 509k tables delivered as annotated PNG images. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as \"simple\" when it does not contain row spans or column spans, otherwise it is \"complex\". The dataset is divided into Train and Val splits (roughly 98% and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDF documents with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits." }, { "label": "text", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 632.51, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 641.42, "r_x1": 545.11, "r_y1": 641.42, "r_x2": 545.11, "r_y2": 632.51, "r_x3": 320.82, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.38, "r_x1": 545.12, "r_y1": 653.38, "r_x2": 545.12, "r_y2": 644.47, "r_x3": 308.86, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.33, "r_x1": 545.12, "r_y1": 665.33, "r_x2": 545.12, "r_y2": 656.42, "r_x3": 308.86, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "cal purposes. Given the size of PubTabNet, we adopted its", "orig": "cal purposes. Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "as PNG images with a resolution of 72 dpi. Additionally,", "orig": "as PNG images with a resolution of 72 dpi. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small" }, { "label": "page_footer", "id": 11, "page_no": 2, "cluster": { "id": 11, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" } ], "body": [ { "label": "text", "id": 10, "page_no": 2, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 250.15, "b": 84.11, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 250.15, "r_y1": 84.11, "r_x2": 250.15, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "tag-decoder which is constrained to the table-tags." }, { "label": "text", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 87.22, "r": 286.37, "b": 275.45, "coord_origin": "TOPLEFT" }, "confidence": 0.982, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 96.13, "r_x1": 70.37, "r_y1": 96.13, "r_x2": 70.37, "r_y2": 87.22, "r_x3": 62.07, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.93, "r_y0": 96.13, "r_x1": 110.95, "r_y1": 96.13, "r_x2": 110.95, "r_y2": 87.22, "r_x3": 76.93, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.54, "r_y0": 96.13, "r_x1": 136.26, "r_y1": 96.13, "r_x2": 136.26, "r_y2": 87.22, "r_x3": 118.54, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 142.82, "r_y0": 96.13, "r_x1": 175.37, "r_y1": 96.13, "r_x2": 175.37, "r_y2": 87.22, "r_x3": 142.82, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.95, "r_y0": 96.13, "r_x1": 232.84, "r_y1": 96.13, "r_x2": 232.84, "r_y2": 87.22, "r_x3": 181.95, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.41, "r_y0": 96.13, "r_x1": 265.41, "r_y1": 96.13, "r_x2": 265.41, "r_y2": 87.22, "r_x3": 239.41, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.98, "r_y0": 96.13, "r_x1": 286.36, "r_y1": 96.13, "r_x2": 286.36, "r_y2": 87.22, "r_x3": 271.98, "r_y3": 87.22, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.08, "r_x1": 286.37, "r_y1": 108.08, "r_x2": 286.37, "r_y2": 99.17, "r_x3": 50.11, "r_y3": 99.17, "coord_origin": "TOPLEFT" }, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 120.04, "r_x1": 286.37, "r_y1": 120.04, "r_x2": 286.37, "r_y2": 111.13, "r_x3": 50.11, "r_y3": 111.13, "coord_origin": "TOPLEFT" }, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.99, "r_x1": 286.37, "r_y1": 131.99, "r_x2": 286.37, "r_y2": 123.09, "r_x3": 50.11, "r_y3": 123.09, "coord_origin": "TOPLEFT" }, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 143.95, "r_x1": 286.37, "r_y1": 143.95, "r_x2": 286.37, "r_y2": 135.04, "r_x3": 50.11, "r_y3": 135.04, "coord_origin": "TOPLEFT" }, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 155.9, "r_x1": 286.37, "r_y1": 155.9, "r_x2": 286.37, "r_y2": 147.0, "r_x3": 50.11, "r_y3": 147.0, "coord_origin": "TOPLEFT" }, "text": "bedded in the content-decoder. This reliance on a custom,", "orig": "bedded in the content-decoder. This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 167.86, "r_x1": 286.37, "r_y1": 167.86, "r_x2": 286.37, "r_y2": 158.95, "r_x3": 50.11, "r_y3": 158.95, "coord_origin": "TOPLEFT" }, "text": "implicit OCR decoder is of course problematic. OCR is a", "orig": "implicit OCR decoder is of course problematic. OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 179.81, "r_x1": 286.37, "r_y1": 179.81, "r_x2": 286.37, "r_y2": 170.91, "r_x3": 50.11, "r_y3": 170.91, "coord_origin": "TOPLEFT" }, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 191.77, "r_x1": 286.37, "r_y1": 191.77, "r_x2": 286.37, "r_y2": 182.86, "r_x3": 50.11, "r_y3": 182.86, "coord_origin": "TOPLEFT" }, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 203.72, "r_x1": 286.37, "r_y1": 203.72, "r_x2": 286.37, "r_y2": 194.82, "r_x3": 50.11, "r_y3": 194.82, "coord_origin": "TOPLEFT" }, "text": "limited availability for non-english content in the current", "orig": "limited availability for non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 215.68, "r_x1": 286.37, "r_y1": 215.68, "r_x2": 286.37, "r_y2": 206.77, "r_x3": 50.11, "r_y3": 206.77, "coord_origin": "TOPLEFT" }, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 227.63, "r_x1": 286.37, "r_y1": 227.63, "r_x2": 286.37, "r_y2": 218.73, "r_x3": 50.11, "r_y3": 218.73, "coord_origin": "TOPLEFT" }, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 239.59, "r_x1": 286.37, "r_y1": 239.59, "r_x2": 286.37, "r_y2": 230.68, "r_x3": 50.11, "r_y3": 230.68, "coord_origin": "TOPLEFT" }, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 251.54, "r_x1": 286.37, "r_y1": 251.54, "r_x2": 286.37, "r_y2": 242.64, "r_x3": 50.11, "r_y3": 242.64, "coord_origin": "TOPLEFT" }, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 263.5, "r_x1": 286.37, "r_y1": 263.5, "r_x2": 286.37, "r_y2": 254.59, "r_x3": 50.11, "r_y3": 254.59, "coord_origin": "TOPLEFT" }, "text": "cell. The latter was the inspiration for the work of this pa-", "orig": "cell. The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 275.45, "r_x1": 64.78, "r_y1": 275.45, "r_x2": 64.78, "r_y2": 266.55, "r_x3": 50.11, "r_y3": 266.55, "coord_origin": "TOPLEFT" }, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-characterrecognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 278.44, "r": 286.37, "b": 490.7, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 287.4, "r_x1": 171.57, "r_y1": 287.4, "r_x2": 171.57, "r_y2": 278.44, "r_x3": 62.07, "r_y3": 278.44, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.57, "r_y0": 287.47, "r_x1": 174.34, "r_y1": 287.47, "r_x2": 174.34, "r_y2": 278.56, "r_x3": 171.57, "r_y3": 278.56, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.19, "r_y0": 287.47, "r_x1": 286.36, "r_y1": 287.47, "r_x2": 286.36, "r_y2": 278.56, "r_x3": 185.19, "r_y3": 278.56, "coord_origin": "TOPLEFT" }, "text": "Graph Neural networks", "orig": "Graph Neural networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 299.42, "r_x1": 286.37, "r_y1": 299.42, "r_x2": 286.37, "r_y2": 290.51, "r_x3": 50.11, "r_y3": 290.51, "coord_origin": "TOPLEFT" }, "text": "(GNN\u2019s) take a radically different approach to table-", "orig": "(GNN\u2019s) take a radically different approach to table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 311.38, "r_x1": 131.17, "r_y1": 311.38, "r_x2": 131.17, "r_y2": 302.47, "r_x3": 50.11, "r_y3": 302.47, "coord_origin": "TOPLEFT" }, "text": "structure extraction.", "orig": "structure extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.85, "r_y0": 311.38, "r_x1": 286.37, "r_y1": 311.38, "r_x2": 286.37, "r_y2": 302.47, "r_x3": 138.85, "r_y3": 302.47, "coord_origin": "TOPLEFT" }, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 323.33, "r_x1": 286.37, "r_y1": 323.33, "r_x2": 286.37, "r_y2": 314.42, "r_x3": 50.11, "r_y3": 314.42, "coord_origin": "TOPLEFT" }, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 335.29, "r_x1": 286.37, "r_y1": 335.29, "r_x2": 286.37, "r_y2": 326.38, "r_x3": 50.11, "r_y3": 326.38, "coord_origin": "TOPLEFT" }, "text": "one creates an initial graph, where each of the text-cells", "orig": "one creates an initial graph, where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 347.24, "r_x1": 286.37, "r_y1": 347.24, "r_x2": 286.37, "r_y2": 338.33, "r_x3": 50.11, "r_y3": 338.33, "coord_origin": "TOPLEFT" }, "text": "becomes a node in the graph similar to [33, 34, 2]. Each", "orig": "becomes a node in the graph similar to [33, 34, 2]. Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.2, "r_x1": 286.37, "r_y1": 359.2, "r_x2": 286.37, "r_y2": 350.29, "r_x3": 50.11, "r_y3": 350.29, "coord_origin": "TOPLEFT" }, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.15, "r_x1": 286.37, "r_y1": 371.15, "r_x2": 286.37, "r_y2": 362.25, "r_x3": 50.11, "r_y3": 362.25, "coord_origin": "TOPLEFT" }, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 383.11, "r_x1": 286.37, "r_y1": 383.11, "r_x2": 286.37, "r_y2": 374.2, "r_x3": 50.11, "r_y3": 374.2, "coord_origin": "TOPLEFT" }, "text": "text. Furthermore, nodes that represent adjacent text-cells", "orig": "text. Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 395.06, "r_x1": 286.37, "r_y1": 395.06, "r_x2": 286.37, "r_y2": 386.16, "r_x3": 50.11, "r_y3": 386.16, "coord_origin": "TOPLEFT" }, "text": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 407.02, "r_x1": 286.37, "r_y1": 407.02, "r_x2": 286.37, "r_y2": 398.11, "r_x3": 50.11, "r_y3": 398.11, "coord_origin": "TOPLEFT" }, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 418.97, "r_x1": 286.37, "r_y1": 418.97, "r_x2": 286.37, "r_y2": 410.07, "r_x3": 50.11, "r_y3": 410.07, "coord_origin": "TOPLEFT" }, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 430.93, "r_x1": 286.37, "r_y1": 430.93, "r_x2": 286.37, "r_y2": 422.02, "r_x3": 50.11, "r_y3": 422.02, "coord_origin": "TOPLEFT" }, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 442.88, "r_x1": 198.24, "r_y1": 442.88, "r_x2": 198.24, "r_y2": 433.98, "r_x3": 50.11, "r_y3": 433.98, "coord_origin": "TOPLEFT" }, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.93, "r_y0": 442.88, "r_x1": 286.37, "r_y1": 442.88, "r_x2": 286.37, "r_y2": 433.98, "r_x3": 205.93, "r_y3": 433.98, "coord_origin": "TOPLEFT" }, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 454.84, "r_x1": 286.37, "r_y1": 454.84, "r_x2": 286.37, "r_y2": 445.93, "r_x3": 50.11, "r_y3": 445.93, "coord_origin": "TOPLEFT" }, "text": "represent the table-structure. With this approach, one can", "orig": "represent the table-structure. With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 466.79, "r_x1": 286.37, "r_y1": 466.79, "r_x2": 286.37, "r_y2": 457.89, "r_x3": 50.11, "r_y3": 457.89, "coord_origin": "TOPLEFT" }, "text": "avoid the need to build custom OCR decoders. However,", "orig": "avoid the need to build custom OCR decoders. However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 478.75, "r_x1": 286.37, "r_y1": 478.75, "r_x2": 286.37, "r_y2": 469.84, "r_x3": 50.11, "r_y3": 469.84, "coord_origin": "TOPLEFT" }, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 490.7, "r_x1": 186.5, "r_y1": 490.7, "r_x2": 186.5, "r_y2": 481.8, "r_x3": 50.11, "r_y3": 481.8, "coord_origin": "TOPLEFT" }, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to tablestructure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 493.69, "r": 286.37, "b": 622.27, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 502.65, "r_x1": 252.88, "r_y1": 502.65, "r_x2": 252.88, "r_y2": 493.69, "r_x3": 62.07, "r_y3": 493.69, "coord_origin": "TOPLEFT" }, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.88, "r_y0": 502.71, "r_x1": 286.37, "r_y1": 502.71, "r_x2": 286.37, "r_y2": 493.81, "r_x3": 252.88, "r_y3": 493.81, "coord_origin": "TOPLEFT" }, "text": ": A pop-", "orig": ": A pop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 514.67, "r_x1": 286.37, "r_y1": 514.67, "r_x2": 286.37, "r_y2": 505.76, "r_x3": 50.11, "r_y3": 505.76, "coord_origin": "TOPLEFT" }, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 526.62, "r_x1": 286.37, "r_y1": 526.62, "r_x2": 286.37, "r_y2": 517.72, "r_x3": 50.11, "r_y3": 517.72, "coord_origin": "TOPLEFT" }, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 538.58, "r_x1": 286.37, "r_y1": 538.58, "r_x2": 286.37, "r_y2": 529.67, "r_x3": 50.11, "r_y3": 529.67, "coord_origin": "TOPLEFT" }, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 550.54, "r_x1": 286.37, "r_y1": 550.54, "r_x2": 286.37, "r_y2": 541.63, "r_x3": 50.11, "r_y3": 541.63, "coord_origin": "TOPLEFT" }, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 562.49, "r_x1": 286.37, "r_y1": 562.49, "r_x2": 286.37, "r_y2": 553.58, "r_x3": 50.11, "r_y3": 553.58, "coord_origin": "TOPLEFT" }, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 574.45, "r_x1": 286.37, "r_y1": 574.45, "r_x2": 286.37, "r_y2": 565.54, "r_x3": 50.11, "r_y3": 565.54, "coord_origin": "TOPLEFT" }, "text": "its images) and finally uses different rule-sets to obtain", "orig": "its images) and finally uses different rule-sets to obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 586.4, "r_x1": 286.37, "r_y1": 586.4, "r_x2": 286.37, "r_y2": 577.49, "r_x3": 50.11, "r_y3": 577.49, "coord_origin": "TOPLEFT" }, "text": "its table-structure. Currently, this approach achieves state-", "orig": "its table-structure. Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 598.36, "r_x1": 286.37, "r_y1": 598.36, "r_x2": 286.37, "r_y2": 589.45, "r_x3": 50.11, "r_y3": 589.45, "coord_origin": "TOPLEFT" }, "text": "of-the-art results, but is not an end-to-end deep-learning", "orig": "of-the-art results, but is not an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 610.31, "r_x1": 286.37, "r_y1": 610.31, "r_x2": 286.37, "r_y2": 601.4, "r_x3": 50.11, "r_y3": 601.4, "coord_origin": "TOPLEFT" }, "text": "method. As such, new rules need to be written if different", "orig": "method. As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 622.27, "r_x1": 175.99, "r_y1": 622.27, "r_x2": 175.99, "r_y2": 613.36, "r_x3": 50.11, "r_y3": 613.36, "coord_origin": "TOPLEFT" }, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Hybrid Deep Learning-Rule-Based approach : A popular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or MaskRCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves stateof-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered." }, { "label": "section_header", "id": 8, "page_no": 2, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 50.11, "t": 635.94, "r": 105.23, "b": 646.69, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 646.69, "r_x1": 57.82, "r_y1": 646.69, "r_x2": 57.82, "r_y2": 635.94, "r_x3": 50.11, "r_y3": 635.94, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.11, "r_y0": 646.69, "r_x1": 105.23, "r_y1": 646.69, "r_x2": 105.23, "r_y2": 635.94, "r_x3": 68.11, "r_y3": 635.94, "coord_origin": "TOPLEFT" }, "text": "Datasets", "orig": "Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Datasets" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 656.43, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 665.33, "r_x1": 286.36, "r_y1": 665.33, "r_x2": 286.36, "r_y2": 656.43, "r_x3": 62.07, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "evaluate our models. These datasets span over various ap-", "orig": "evaluate our models. These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 166.25, "r_y1": 701.2, "r_x2": 166.25, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.69, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 173.69, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-" }, { "label": "picture", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 312.1, "t": 78.44, "r": 550.39, "b": 250.61, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.8, "r_y0": 88.56, "r_x1": 486.85, "r_y1": 88.56, "r_x2": 486.85, "r_y2": 79.81, "r_x3": 380.8, "r_y3": 79.81, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.77, "r_y0": 250.77, "r_x1": 469.79, "r_y1": 250.77, "r_x2": 469.79, "r_y2": 242.03, "r_x3": 396.77, "r_y3": 242.03, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.98, "r_y0": 239.25, "r_x1": 324.79, "r_y1": 239.25, "r_x2": 324.79, "r_y2": 233.42, "r_x3": 320.98, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.48, "r_y0": 239.25, "r_x1": 418.11, "r_y1": 239.25, "r_x2": 418.11, "r_y2": 233.42, "r_x3": 410.48, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.85, "r_y0": 239.25, "r_x1": 508.48, "r_y1": 239.25, "r_x2": 508.48, "r_y2": 233.42, "r_x3": 500.85, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.3, "r_y0": 239.25, "r_x1": 372.93, "r_y1": 239.25, "r_x2": 372.93, "r_y2": 233.42, "r_x3": 365.3, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.67, "r_y0": 239.25, "r_x1": 463.3, "r_y1": 239.25, "r_x2": 463.3, "r_y2": 233.42, "r_x3": 455.67, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.04, "r_y0": 239.25, "r_x1": 549.67, "r_y1": 239.25, "r_x2": 549.67, "r_y2": 233.42, "r_x3": 542.04, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04, "r_y0": 236.28, "r_x1": 319.86, "r_y1": 236.28, "r_x2": 319.86, "r_y2": 230.45, "r_x3": 316.04, "r_y3": 230.45, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.63, "r_y0": 204.52, "r_x1": 316.44, "r_y1": 204.52, "r_x2": 316.44, "r_y2": 198.69, "r_x3": 312.63, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.44, "r_y0": 204.52, "r_x1": 320.26, "r_y1": 204.52, "r_x2": 320.26, "r_y2": 198.69, "r_x3": 316.44, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.15, "r_y0": 173.93, "r_x1": 316.97, "r_y1": 173.93, "r_x2": 316.97, "r_y2": 168.1, "r_x3": 313.15, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96, "r_y0": 173.93, "r_x1": 320.78, "r_y1": 173.93, "r_x2": 320.78, "r_y2": 168.1, "r_x3": 316.96, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.93, "r_y0": 142.42, "r_x1": 316.75, "r_y1": 142.42, "r_x2": 316.75, "r_y2": 136.59, "r_x3": 312.93, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74, "r_y0": 142.42, "r_x1": 320.56, "r_y1": 142.42, "r_x2": 320.56, "r_y2": 136.59, "r_x3": 316.74, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 111.43, "r_x1": 316.3, "r_y1": 111.43, "r_x2": 316.3, "r_y2": 105.6, "r_x3": 312.48, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 111.43, "r_x1": 320.11, "r_y1": 111.43, "r_x2": 320.11, "r_y2": 105.6, "r_x3": 316.3, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 218.09, "r_x1": 316.3, "r_y1": 218.09, "r_x2": 316.3, "r_y2": 212.26, "r_x3": 312.48, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 218.09, "r_x1": 320.11, "r_y1": 218.09, "r_x2": 320.11, "r_y2": 212.26, "r_x3": 316.3, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.08, "r_y0": 189.55, "r_x1": 316.89, "r_y1": 189.55, "r_x2": 316.89, "r_y2": 183.72, "r_x3": 313.08, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89, "r_y0": 189.55, "r_x1": 320.71, "r_y1": 189.55, "r_x2": 320.71, "r_y2": 183.72, "r_x3": 316.89, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76, "r_y0": 158.31, "r_x1": 316.58, "r_y1": 158.31, "r_x2": 316.58, "r_y2": 152.47, "r_x3": 312.76, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.58, "r_y0": 158.31, "r_x1": 320.39, "r_y1": 158.31, "r_x2": 320.39, "r_y2": 152.47, "r_x3": 316.58, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.2, "r_y0": 126.4, "r_x1": 316.01, "r_y1": 126.4, "r_x2": 316.01, "r_y2": 120.57, "r_x3": 312.2, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01, "r_y0": 126.4, "r_x1": 319.83, "r_y1": 126.4, "r_x2": 319.83, "r_y2": 120.57, "r_x3": 316.01, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 95.94, "r_x1": 316.63, "r_y1": 95.94, "r_x2": 316.63, "r_y2": 90.11, "r_x3": 312.82, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63, "r_y0": 95.94, "r_x1": 320.45, "r_y1": 95.94, "r_x2": 320.45, "r_y2": 90.11, "r_x3": 316.63, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17, "r_y0": 230.02, "r_x1": 536.94, "r_y1": 230.02, "r_x2": 536.94, "r_y2": 222.73, "r_x3": 532.17, "r_y3": 222.73, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.88, "r_y0": 115.56, "r_x1": 547.61, "r_y1": 115.56, "r_x2": 547.61, "r_y2": 108.27, "r_x3": 532.88, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.77, "r_y0": 138.07, "r_x1": 542.74, "r_y1": 138.07, "r_x2": 542.74, "r_y2": 130.78, "r_x3": 532.77, "r_y3": 130.78, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.8, "r_y0": 161.21, "r_x1": 542.76, "r_y1": 161.21, "r_x2": 542.76, "r_y2": 153.92, "r_x3": 532.8, "r_y3": 153.92, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.57, "r_y0": 184.05, "r_x1": 542.54, "r_y1": 184.05, "r_x2": 542.54, "r_y2": 176.76, "r_x3": 532.57, "r_y3": 176.76, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.15, "r_y0": 206.94, "r_x1": 542.11, "r_y1": 206.94, "r_x2": 542.11, "r_y2": 199.65, "r_x3": 532.15, "r_y3": 199.65, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 12, "label": "section_header", "bbox": { "l": 380.8, "t": 79.81, "r": 486.85, "b": 88.56, "coord_origin": "TOPLEFT" }, "confidence": 0.569, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.8, "r_y0": 88.56, "r_x1": 486.85, "r_y1": 88.56, "r_x2": 486.85, "r_y2": 79.81, "r_x3": 380.8, "r_y3": 79.81, "coord_origin": "TOPLEFT" }, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 396.77, "t": 242.03, "r": 469.79, "b": 250.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.77, "r_y0": 250.77, "r_x1": 469.79, "r_y1": 250.77, "r_x2": 469.79, "r_y2": 242.03, "r_x3": 396.77, "r_y3": 242.03, "coord_origin": "TOPLEFT" }, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 320.98, "t": 233.42, "r": 324.79, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.98, "r_y0": 239.25, "r_x1": 324.79, "r_y1": 239.25, "r_x2": 324.79, "r_y2": 233.42, "r_x3": 320.98, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 410.48, "t": 233.42, "r": 418.11, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.48, "r_y0": 239.25, "r_x1": 418.11, "r_y1": 239.25, "r_x2": 418.11, "r_y2": 233.42, "r_x3": 410.48, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 500.85, "t": 233.42, "r": 508.48, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 500.85, "r_y0": 239.25, "r_x1": 508.48, "r_y1": 239.25, "r_x2": 508.48, "r_y2": 233.42, "r_x3": 500.85, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 365.3, "t": 233.42, "r": 372.93, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.3, "r_y0": 239.25, "r_x1": 372.93, "r_y1": 239.25, "r_x2": 372.93, "r_y2": 233.42, "r_x3": 365.3, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 455.67, "t": 233.42, "r": 463.3, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.67, "r_y0": 239.25, "r_x1": 463.3, "r_y1": 239.25, "r_x2": 463.3, "r_y2": 233.42, "r_x3": 455.67, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 542.04, "t": 233.42, "r": 549.67, "b": 239.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 542.04, "r_y0": 239.25, "r_x1": 549.67, "r_y1": 239.25, "r_x2": 549.67, "r_y2": 233.42, "r_x3": 542.04, "r_y3": 233.42, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 316.04, "t": 230.45, "r": 319.86, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.04, "r_y0": 236.28, "r_x1": 319.86, "r_y1": 236.28, "r_x2": 319.86, "r_y2": 230.45, "r_x3": 316.04, "r_y3": 230.45, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 312.63, "t": 198.69, "r": 316.44, "b": 204.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.63, "r_y0": 204.52, "r_x1": 316.44, "r_y1": 204.52, "r_x2": 316.44, "r_y2": 198.69, "r_x3": 312.63, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 316.44, "t": 198.69, "r": 320.26, "b": 204.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.44, "r_y0": 204.52, "r_x1": 320.26, "r_y1": 204.52, "r_x2": 320.26, "r_y2": 198.69, "r_x3": 316.44, "r_y3": 198.69, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 313.15, "t": 168.1, "r": 316.97, "b": 173.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.15, "r_y0": 173.93, "r_x1": 316.97, "r_y1": 173.93, "r_x2": 316.97, "r_y2": 168.1, "r_x3": 313.15, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 316.96, "t": 168.1, "r": 320.78, "b": 173.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.96, "r_y0": 173.93, "r_x1": 320.78, "r_y1": 173.93, "r_x2": 320.78, "r_y2": 168.1, "r_x3": 316.96, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 312.93, "t": 136.59, "r": 316.75, "b": 142.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.93, "r_y0": 142.42, "r_x1": 316.75, "r_y1": 142.42, "r_x2": 316.75, "r_y2": 136.59, "r_x3": 312.93, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 316.74, "t": 136.59, "r": 320.56, "b": 142.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.74, "r_y0": 142.42, "r_x1": 320.56, "r_y1": 142.42, "r_x2": 320.56, "r_y2": 136.59, "r_x3": 316.74, "r_y3": 136.59, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 312.48, "t": 105.6, "r": 316.3, "b": 111.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 111.43, "r_x1": 316.3, "r_y1": 111.43, "r_x2": 316.3, "r_y2": 105.6, "r_x3": 312.48, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 316.3, "t": 105.6, "r": 320.11, "b": 111.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 111.43, "r_x1": 320.11, "r_y1": 111.43, "r_x2": 320.11, "r_y2": 105.6, "r_x3": 316.3, "r_y3": 105.6, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 312.48, "t": 212.26, "r": 316.3, "b": 218.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.48, "r_y0": 218.09, "r_x1": 316.3, "r_y1": 218.09, "r_x2": 316.3, "r_y2": 212.26, "r_x3": 312.48, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 316.3, "t": 212.26, "r": 320.11, "b": 218.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.3, "r_y0": 218.09, "r_x1": 320.11, "r_y1": 218.09, "r_x2": 320.11, "r_y2": 212.26, "r_x3": 316.3, "r_y3": 212.26, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 313.08, "t": 183.72, "r": 316.89, "b": 189.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.08, "r_y0": 189.55, "r_x1": 316.89, "r_y1": 189.55, "r_x2": 316.89, "r_y2": 183.72, "r_x3": 313.08, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 316.89, "t": 183.72, "r": 320.71, "b": 189.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.89, "r_y0": 189.55, "r_x1": 320.71, "r_y1": 189.55, "r_x2": 320.71, "r_y2": 183.72, "r_x3": 316.89, "r_y3": 183.72, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 312.76, "t": 152.47, "r": 316.58, "b": 158.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.76, "r_y0": 158.31, "r_x1": 316.58, "r_y1": 158.31, "r_x2": 316.58, "r_y2": 152.47, "r_x3": 312.76, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 316.58, "t": 152.47, "r": 320.39, "b": 158.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.58, "r_y0": 158.31, "r_x1": 320.39, "r_y1": 158.31, "r_x2": 320.39, "r_y2": 152.47, "r_x3": 316.58, "r_y3": 152.47, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 312.2, "t": 120.57, "r": 316.01, "b": 126.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.2, "r_y0": 126.4, "r_x1": 316.01, "r_y1": 126.4, "r_x2": 316.01, "r_y2": 120.57, "r_x3": 312.2, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 316.01, "t": 120.57, "r": 319.83, "b": 126.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.01, "r_y0": 126.4, "r_x1": 319.83, "r_y1": 126.4, "r_x2": 319.83, "r_y2": 120.57, "r_x3": 316.01, "r_y3": 120.57, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 312.82, "t": 90.11, "r": 316.63, "b": 95.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 95.94, "r_x1": 316.63, "r_y1": 95.94, "r_x2": 316.63, "r_y2": 90.11, "r_x3": 312.82, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 316.63, "t": 90.11, "r": 320.45, "b": 95.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.63, "r_y0": 95.94, "r_x1": 320.45, "r_y1": 95.94, "r_x2": 320.45, "r_y2": 90.11, "r_x3": 316.63, "r_y3": 90.11, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 532.17, "t": 222.73, "r": 536.94, "b": 230.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.17, "r_y0": 230.02, "r_x1": 536.94, "r_y1": 230.02, "r_x2": 536.94, "r_y2": 222.73, "r_x3": 532.17, "r_y3": 222.73, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 532.88, "t": 108.27, "r": 547.61, "b": 115.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.88, "r_y0": 115.56, "r_x1": 547.61, "r_y1": 115.56, "r_x2": 547.61, "r_y2": 108.27, "r_x3": 532.88, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 532.77, "t": 130.78, "r": 542.74, "b": 138.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.77, "r_y0": 138.07, "r_x1": 542.74, "r_y1": 138.07, "r_x2": 542.74, "r_y2": 130.78, "r_x3": 532.77, "r_y3": 130.78, "coord_origin": "TOPLEFT" }, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 532.8, "t": 153.92, "r": 542.76, "b": 161.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.8, "r_y0": 161.21, "r_x1": 542.76, "r_y1": 161.21, "r_x2": 542.76, "r_y2": 153.92, "r_x3": 532.8, "r_y3": 153.92, "coord_origin": "TOPLEFT" }, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 532.57, "t": 176.76, "r": 542.54, "b": 184.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.57, "r_y0": 184.05, "r_x1": 542.54, "r_y1": 184.05, "r_x2": 542.54, "r_y2": 176.76, "r_x3": 532.57, "r_y3": 176.76, "coord_origin": "TOPLEFT" }, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 532.15, "t": 199.65, "r": 542.11, "b": 206.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.15, "r_y0": 206.94, "r_x1": 542.11, "r_y1": 206.94, "r_x2": 542.11, "r_y2": 199.65, "r_x3": 532.15, "r_y3": 199.65, "coord_origin": "TOPLEFT" }, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 7, "page_no": 2, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 308.86, "t": 267.84, "r": 545.12, "b": 288.7, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 276.74, "r_x1": 346.06, "r_y1": 276.74, "r_x2": 346.06, "r_y2": 267.84, "r_x3": 308.86, "r_y3": 267.84, "coord_origin": "TOPLEFT" }, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.49, "r_y0": 276.74, "r_x1": 545.12, "r_y1": 276.74, "r_x2": 545.12, "r_y2": 267.84, "r_x3": 354.49, "r_y3": 267.84, "coord_origin": "TOPLEFT" }, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 288.7, "r_x1": 498.57, "r_y1": 288.7, "r_x2": 498.57, "r_y2": 279.79, "r_x3": 308.86, "r_y3": 279.79, "coord_origin": "TOPLEFT" }, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets" }, { "label": "text", "id": 9, "page_no": 2, "cluster": { "id": 9, "label": "text", "bbox": { "l": 308.86, "t": 317.47, "r": 437.27, "b": 326.38, "coord_origin": "TOPLEFT" }, "confidence": 0.888, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 326.38, "r_x1": 437.27, "r_y1": 326.38, "r_x2": 437.27, "r_y2": 317.47, "r_x3": 308.86, "r_y3": 317.47, "coord_origin": "TOPLEFT" }, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "balance in the previous datasets." }, { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 331.53, "r": 545.12, "b": 627.36, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 340.44, "r_x1": 545.12, "r_y1": 340.44, "r_x2": 545.12, "r_y2": 331.53, "r_x3": 320.82, "r_y3": 331.53, "coord_origin": "TOPLEFT" }, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 352.39, "r_x1": 545.12, "r_y1": 352.39, "r_x2": 545.12, "r_y2": 343.49, "r_x3": 308.86, "r_y3": 343.49, "coord_origin": "TOPLEFT" }, "text": "annotated PNG images. The annotations consist of the table", "orig": "annotated PNG images. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 364.35, "r_x1": 545.12, "r_y1": 364.35, "r_x2": 545.12, "r_y2": 355.44, "r_x3": 308.86, "r_y3": 355.44, "coord_origin": "TOPLEFT" }, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 376.3, "r_x1": 545.12, "r_y1": 376.3, "r_x2": 545.12, "r_y2": 367.4, "r_x3": 308.86, "r_y3": 367.4, "coord_origin": "TOPLEFT" }, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 388.26, "r_x1": 545.12, "r_y1": 388.26, "r_x2": 545.12, "r_y2": 379.35, "r_x3": 308.86, "r_y3": 379.35, "coord_origin": "TOPLEFT" }, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.21, "r_x1": 545.12, "r_y1": 400.21, "r_x2": 545.12, "r_y2": 391.31, "r_x3": 308.86, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "a table is characterized as \u201csimple\u201d when it does not contain", "orig": "a table is characterized as \u201csimple\u201d when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.17, "r_x1": 545.12, "r_y1": 412.17, "r_x2": 545.12, "r_y2": 403.26, "r_x3": 308.86, "r_y3": 403.26, "coord_origin": "TOPLEFT" }, "text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.12, "r_x1": 545.12, "r_y1": 424.12, "r_x2": 545.12, "r_y2": 415.22, "r_x3": 308.86, "r_y3": 415.22, "coord_origin": "TOPLEFT" }, "text": "dataset is divided into Train and Val splits (roughly 98% and", "orig": "dataset is divided into Train and Val splits (roughly 98% and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.08, "r_x1": 545.12, "r_y1": 436.08, "r_x2": 545.12, "r_y2": 427.17, "r_x3": 308.86, "r_y3": 427.17, "coord_origin": "TOPLEFT" }, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.03, "r_x1": 545.12, "r_y1": 448.03, "r_x2": 545.12, "r_y2": 439.13, "r_x3": 308.86, "r_y3": 439.13, "coord_origin": "TOPLEFT" }, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 459.99, "r_x1": 545.12, "r_y1": 459.99, "r_x2": 545.12, "r_y2": 451.08, "r_x3": 308.86, "r_y3": 451.08, "coord_origin": "TOPLEFT" }, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 471.94, "r_x1": 545.12, "r_y1": 471.94, "r_x2": 545.12, "r_y2": 463.04, "r_x3": 308.86, "r_y3": 463.04, "coord_origin": "TOPLEFT" }, "text": "single-page PDF documents with mixed table structures and", "orig": "single-page PDF documents with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 483.9, "r_x1": 545.12, "r_y1": 483.9, "r_x2": 545.12, "r_y2": 474.99, "r_x3": 308.86, "r_y3": 474.99, "coord_origin": "TOPLEFT" }, "text": "text content. Similarly to the PubTabNet, the annotations", "orig": "text content. Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 495.86, "r_x1": 545.12, "r_y1": 495.86, "r_x2": 545.12, "r_y2": 486.95, "r_x3": 308.86, "r_y3": 486.95, "coord_origin": "TOPLEFT" }, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 507.81, "r_x1": 545.12, "r_y1": 507.81, "r_x2": 545.12, "r_y2": 498.9, "r_x3": 308.86, "r_y3": 498.9, "coord_origin": "TOPLEFT" }, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 519.77, "r_x1": 545.12, "r_y1": 519.77, "r_x2": 545.12, "r_y2": 510.86, "r_x3": 308.86, "r_y3": 510.86, "coord_origin": "TOPLEFT" }, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 531.72, "r_x1": 545.12, "r_y1": 531.72, "r_x2": 545.12, "r_y2": 522.81, "r_x3": 308.86, "r_y3": 522.81, "coord_origin": "TOPLEFT" }, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 543.68, "r_x1": 545.12, "r_y1": 543.68, "r_x2": 545.12, "r_y2": 534.77, "r_x3": 308.86, "r_y3": 534.77, "coord_origin": "TOPLEFT" }, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 555.63, "r_x1": 545.12, "r_y1": 555.63, "r_x2": 545.12, "r_y2": 546.72, "r_x3": 308.86, "r_y3": 546.72, "coord_origin": "TOPLEFT" }, "text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 567.59, "r_x1": 545.12, "r_y1": 567.59, "r_x2": 545.12, "r_y2": 558.68, "r_x3": 308.86, "r_y3": 558.68, "coord_origin": "TOPLEFT" }, "text": "47% complex). Finally the TableBank dataset consists of", "orig": "47% complex). Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 579.54, "r_x1": 545.12, "r_y1": 579.54, "r_x2": 545.12, "r_y2": 570.64, "r_x3": 308.86, "r_y3": 570.64, "coord_origin": "TOPLEFT" }, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 591.5, "r_x1": 545.11, "r_y1": 591.5, "r_x2": 545.11, "r_y2": 582.59, "r_x3": 308.86, "r_y3": 582.59, "coord_origin": "TOPLEFT" }, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 603.45, "r_x1": 545.12, "r_y1": 603.45, "r_x2": 545.12, "r_y2": 594.55, "r_x3": 308.86, "r_y3": 594.55, "coord_origin": "TOPLEFT" }, "text": "boxes of the table cells. The entire dataset consists of sim-", "orig": "boxes of the table cells. The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 615.41, "r_x1": 545.12, "r_y1": 615.41, "r_x2": 545.12, "r_y2": 606.5, "r_x3": 308.86, "r_y3": 606.5, "coord_origin": "TOPLEFT" }, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 627.36, "r_x1": 348.16, "r_y1": 627.36, "r_x2": 348.16, "r_y2": 618.46, "r_x3": 308.86, "r_y3": 618.46, "coord_origin": "TOPLEFT" }, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The PubTabNet dataset contains 509k tables delivered as annotated PNG images. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as \"simple\" when it does not contain row spans or column spans, otherwise it is \"complex\". The dataset is divided into Train and Val splits (roughly 98% and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDF documents with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits." }, { "label": "text", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 632.51, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 641.42, "r_x1": 545.11, "r_y1": 641.42, "r_x2": 545.11, "r_y2": 632.51, "r_x3": 320.82, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.38, "r_x1": 545.12, "r_y1": 653.38, "r_x2": 545.12, "r_y2": 644.47, "r_x3": 308.86, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.33, "r_x1": 545.12, "r_y1": 665.33, "r_x2": 545.12, "r_y2": 656.42, "r_x3": 308.86, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "cal purposes. Given the size of PubTabNet, we adopted its", "orig": "cal purposes. Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "as PNG images with a resolution of 72 dpi. Additionally,", "orig": "as PNG images with a resolution of 72 dpi. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small" } ], "headers": [ { "label": "page_footer", "id": 11, "page_no": 2, "cluster": { "id": 11, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" } ] } }, { "page_no": 3, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 212.28, "r_y1": 96.07, "r_x2": 212.28, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 109.87, "r_x1": 286.37, "r_y1": 109.87, "r_x2": 286.37, "r_y2": 100.96, "r_x3": 62.07, "r_y3": 100.96, "coord_origin": "TOPLEFT" }, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 121.82, "r_x1": 286.37, "r_y1": 121.82, "r_x2": 286.37, "r_y2": 112.92, "r_x3": 50.11, "r_y3": 112.92, "coord_origin": "TOPLEFT" }, "text": "is essential to train our models. In order to distinguish be-", "orig": "is essential to train our models. In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 133.78, "r_x1": 286.37, "r_y1": 133.78, "r_x2": 286.37, "r_y2": 124.87, "r_x3": 50.11, "r_y3": 124.87, "coord_origin": "TOPLEFT" }, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 145.73, "r_x1": 286.37, "r_y1": 145.73, "r_x2": 286.37, "r_y2": 136.83, "r_x3": 50.11, "r_y3": 136.83, "coord_origin": "TOPLEFT" }, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 157.69, "r_x1": 286.37, "r_y1": 157.69, "r_x2": 286.37, "r_y2": 148.78, "r_x3": 50.11, "r_y3": 148.78, "coord_origin": "TOPLEFT" }, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 169.64, "r_x1": 286.37, "r_y1": 169.64, "r_x2": 286.37, "r_y2": 160.74, "r_x3": 50.11, "r_y3": 160.74, "coord_origin": "TOPLEFT" }, "text": "tables (e.g. TableBank) or they narrow their scope only to", "orig": "tables (e.g. TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 181.6, "r_x1": 286.37, "r_y1": 181.6, "r_x2": 286.37, "r_y2": 172.69, "r_x3": 50.11, "r_y3": 172.69, "coord_origin": "TOPLEFT" }, "text": "non-empty cells. Therefore, it was imperative to introduce", "orig": "non-empty cells. Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 193.55, "r_x1": 286.37, "r_y1": 193.55, "r_x2": 286.37, "r_y2": 184.65, "r_x3": 50.11, "r_y3": 184.65, "coord_origin": "TOPLEFT" }, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 205.51, "r_x1": 286.37, "r_y1": 205.51, "r_x2": 286.37, "r_y2": 196.6, "r_x3": 50.11, "r_y3": 196.6, "coord_origin": "TOPLEFT" }, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 217.46, "r_x1": 286.37, "r_y1": 217.46, "r_x2": 286.37, "r_y2": 208.56, "r_x3": 50.11, "r_y3": 208.56, "coord_origin": "TOPLEFT" }, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 229.42, "r_x1": 286.37, "r_y1": 229.42, "r_x2": 286.37, "r_y2": 220.51, "r_x3": 50.11, "r_y3": 220.51, "coord_origin": "TOPLEFT" }, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 241.37, "r_x1": 286.37, "r_y1": 241.37, "r_x2": 286.37, "r_y2": 232.47, "r_x3": 50.11, "r_y3": 232.47, "coord_origin": "TOPLEFT" }, "text": "ers the table structure. Notice that each table cell may oc-", "orig": "ers the table structure. Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 253.33, "r_x1": 286.37, "r_y1": 253.33, "r_x2": 286.37, "r_y2": 244.42, "r_x3": 50.11, "r_y3": 244.42, "coord_origin": "TOPLEFT" }, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 265.28, "r_x1": 286.37, "r_y1": 265.28, "r_x2": 286.37, "r_y2": 256.38, "r_x3": 50.11, "r_y3": 256.38, "coord_origin": "TOPLEFT" }, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 277.24, "r_x1": 286.37, "r_y1": 277.24, "r_x2": 286.37, "r_y2": 268.33, "r_x3": 50.11, "r_y3": 268.33, "coord_origin": "TOPLEFT" }, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 289.2, "r_x1": 68.65, "r_y1": 289.2, "r_x2": 68.65, "r_y2": 280.29, "r_x3": 50.11, "r_y3": 280.29, "coord_origin": "TOPLEFT" }, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.57, "r_y0": 289.2, "r_x1": 286.37, "r_y1": 289.2, "r_x2": 286.37, "r_y2": 280.29, "r_x3": 75.57, "r_y3": 280.29, "coord_origin": "TOPLEFT" }, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 301.15, "r_x1": 286.37, "r_y1": 301.15, "r_x2": 286.37, "r_y2": 292.24, "r_x3": 50.11, "r_y3": 292.24, "coord_origin": "TOPLEFT" }, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 313.11, "r_x1": 75.7, "r_y1": 313.11, "r_x2": 75.7, "r_y2": 304.2, "r_x3": 50.11, "r_y3": 304.2, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 326.9, "r_x1": 286.36, "r_y1": 326.9, "r_x2": 286.36, "r_y2": 318.0, "r_x3": 62.07, "r_y3": 318.0, "coord_origin": "TOPLEFT" }, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 338.86, "r_x1": 286.37, "r_y1": 338.86, "r_x2": 286.37, "r_y2": 329.95, "r_x3": 50.11, "r_y3": 329.95, "coord_origin": "TOPLEFT" }, "text": "all datasets are skewed towards simpler structures with", "orig": "all datasets are skewed towards simpler structures with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 350.81, "r_x1": 286.37, "r_y1": 350.81, "r_x2": 286.37, "r_y2": 341.91, "r_x3": 50.11, "r_y3": 341.91, "coord_origin": "TOPLEFT" }, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 362.77, "r_x1": 286.37, "r_y1": 362.77, "r_x2": 286.37, "r_y2": 353.86, "r_x3": 50.11, "r_y3": 353.86, "coord_origin": "TOPLEFT" }, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 374.72, "r_x1": 286.37, "r_y1": 374.72, "r_x2": 286.37, "r_y2": 365.82, "r_x3": 50.11, "r_y3": 365.82, "coord_origin": "TOPLEFT" }, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 386.68, "r_x1": 141.59, "r_y1": 386.68, "r_x2": 141.59, "r_y2": 377.77, "r_x3": 50.11, "r_y3": 377.77, "coord_origin": "TOPLEFT" }, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.7, "r_y0": 386.68, "r_x1": 286.37, "r_y1": 386.68, "r_x2": 286.37, "r_y2": 377.77, "r_x3": 148.7, "r_y3": 377.77, "coord_origin": "TOPLEFT" }, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 398.63, "r_x1": 286.37, "r_y1": 398.63, "r_x2": 286.37, "r_y2": 389.73, "r_x3": 50.11, "r_y3": 389.73, "coord_origin": "TOPLEFT" }, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 410.59, "r_x1": 286.37, "r_y1": 410.59, "r_x2": 286.37, "r_y2": 401.68, "r_x3": 50.11, "r_y3": 401.68, "coord_origin": "TOPLEFT" }, "text": "Net) is restricted to a certain domain. Ultimately, the lack", "orig": "Net) is restricted to a certain domain. Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 422.54, "r_x1": 286.37, "r_y1": 422.54, "r_x2": 286.37, "r_y2": 413.64, "r_x3": 50.11, "r_y3": 413.64, "coord_origin": "TOPLEFT" }, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 434.5, "r_x1": 216.4, "r_y1": 434.5, "r_x2": 216.4, "r_y2": 425.59, "r_x3": 50.11, "r_y3": 425.59, "coord_origin": "TOPLEFT" }, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 448.3, "r_x1": 286.36, "r_y1": 448.3, "r_x2": 286.36, "r_y2": 439.39, "r_x3": 62.07, "r_y3": 439.39, "coord_origin": "TOPLEFT" }, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 460.25, "r_x1": 172.14, "r_y1": 460.25, "r_x2": 172.14, "r_y2": 451.34, "r_x3": 50.11, "r_y3": 451.34, "coord_origin": "TOPLEFT" }, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.15, "r_y0": 460.02, "r_x1": 224.71, "r_y1": 460.02, "r_x2": 224.71, "r_y2": 451.43, "r_x3": 174.15, "r_y3": 451.43, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.71, "r_y0": 460.25, "r_x1": 286.37, "r_y1": 460.25, "r_x2": 286.37, "r_y2": 451.34, "r_x3": 224.71, "r_y3": 451.34, "coord_origin": "TOPLEFT" }, "text": ". This approach", "orig": ". This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 472.21, "r_x1": 286.37, "r_y1": 472.21, "r_x2": 286.37, "r_y2": 463.3, "r_x3": 50.11, "r_y3": 463.3, "coord_origin": "TOPLEFT" }, "text": "offers control over: 1) the size of the dataset, 2) the table", "orig": "offers control over: 1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 484.16, "r_x1": 286.37, "r_y1": 484.16, "r_x2": 286.37, "r_y2": 475.26, "r_x3": 50.11, "r_y3": 475.26, "coord_origin": "TOPLEFT" }, "text": "structure, 3) the table style and 4) the type of content. The", "orig": "structure, 3) the table style and 4) the type of content. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 496.12, "r_x1": 286.37, "r_y1": 496.12, "r_x2": 286.37, "r_y2": 487.21, "r_x3": 50.11, "r_y3": 487.21, "coord_origin": "TOPLEFT" }, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 508.07, "r_x1": 286.37, "r_y1": 508.07, "r_x2": 286.37, "r_y2": 499.17, "r_x3": 50.11, "r_y3": 499.17, "coord_origin": "TOPLEFT" }, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 520.03, "r_x1": 286.37, "r_y1": 520.03, "r_x2": 286.37, "r_y2": 511.12, "r_x3": 50.11, "r_y3": 511.12, "coord_origin": "TOPLEFT" }, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 531.98, "r_x1": 286.37, "r_y1": 531.98, "r_x2": 286.37, "r_y2": 523.08, "r_x3": 50.11, "r_y3": 523.08, "coord_origin": "TOPLEFT" }, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 543.94, "r_x1": 286.37, "r_y1": 543.94, "r_x2": 286.37, "r_y2": 535.03, "r_x3": 50.11, "r_y3": 535.03, "coord_origin": "TOPLEFT" }, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 555.89, "r_x1": 286.37, "r_y1": 555.89, "r_x2": 286.37, "r_y2": 546.99, "r_x3": 50.11, "r_y3": 546.99, "coord_origin": "TOPLEFT" }, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 567.85, "r_x1": 286.37, "r_y1": 567.85, "r_x2": 286.37, "r_y2": 558.94, "r_x3": 50.11, "r_y3": 558.94, "coord_origin": "TOPLEFT" }, "text": "corpora. By controlling the size and scope of the synthetic", "orig": "corpora. By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 579.8, "r_x1": 286.37, "r_y1": 579.8, "r_x2": 286.37, "r_y2": 570.9, "r_x3": 50.11, "r_y3": 570.9, "coord_origin": "TOPLEFT" }, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 591.76, "r_x1": 286.37, "r_y1": 591.76, "r_x2": 286.37, "r_y2": 582.85, "r_x3": 50.11, "r_y3": 582.85, "coord_origin": "TOPLEFT" }, "text": "variety of different conditions. For example, we can first", "orig": "variety of different conditions. For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 603.71, "r_x1": 286.37, "r_y1": 603.71, "r_x2": 286.37, "r_y2": 594.81, "r_x3": 50.11, "r_y3": 594.81, "coord_origin": "TOPLEFT" }, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 615.67, "r_x1": 286.37, "r_y1": 615.67, "r_x2": 286.37, "r_y2": 606.76, "r_x3": 50.11, "r_y3": 606.76, "coord_origin": "TOPLEFT" }, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 627.62, "r_x1": 209.75, "r_y1": 627.62, "r_x2": 209.75, "r_y2": 618.72, "r_x3": 50.11, "r_y3": 618.72, "coord_origin": "TOPLEFT" }, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 641.42, "r_x1": 286.36, "r_y1": 641.42, "r_x2": 286.36, "r_y2": 632.51, "r_x3": 62.07, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.43, "r_x3": 50.11, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "generated text. The first two synthetic datasets have been", "orig": "generated text. The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 176.57, "r_x1": 344.62, "r_y1": 176.57, "r_x2": 344.62, "r_y2": 167.66, "r_x3": 308.86, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "Table 1:", "orig": "Table 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.08, "r_y0": 176.57, "r_x1": 380.45, "r_y1": 176.57, "r_x2": 380.45, "r_y2": 167.66, "r_x3": 361.08, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.57, "r_y0": 176.34, "r_x1": 468.68, "r_y1": 176.34, "r_x2": 468.68, "r_y2": 167.75, "r_x3": 386.57, "r_y3": 167.75, "coord_origin": "TOPLEFT" }, "text": "\u201cCombined-Tabnet\u201d", "orig": "\u201cCombined-Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.8, "r_y0": 176.57, "r_x1": 489.18, "r_y1": 176.57, "r_x2": 489.18, "r_y2": 167.66, "r_x3": 474.8, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.3, "r_y0": 176.34, "r_x1": 545.11, "r_y1": 176.34, "r_x2": 545.11, "r_y2": 167.75, "r_x3": 495.3, "r_y3": 167.75, "coord_origin": "TOPLEFT" }, "text": "\u201dCombined-", "orig": "\u201dCombined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 188.29, "r_x1": 341.16, "r_y1": 188.29, "r_x2": 341.16, "r_y2": 179.71, "r_x3": 308.86, "r_y3": 179.71, "coord_origin": "TOPLEFT" }, "text": "Tabnet\u201d", "orig": "Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.46, "r_y0": 188.52, "r_x1": 545.11, "r_y1": 188.52, "r_x2": 545.11, "r_y2": 179.62, "r_x3": 343.46, "r_y3": 179.62, "coord_origin": "TOPLEFT" }, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 200.48, "r_x1": 545.12, "r_y1": 200.48, "r_x2": 545.12, "r_y2": 191.57, "r_x3": 308.86, "r_y3": 191.57, "coord_origin": "TOPLEFT" }, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 212.43, "r_x1": 545.11, "r_y1": 212.43, "r_x2": 545.11, "r_y2": 203.53, "r_x3": 308.86, "r_y3": 203.53, "coord_origin": "TOPLEFT" }, "text": "and Fintabnet. (**) The combined dataset is the processed", "orig": "and Fintabnet. (**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 224.39, "r_x1": 523.93, "r_y1": 224.39, "r_x2": 523.93, "r_y2": 215.48, "r_x3": 308.86, "r_y3": 215.48, "coord_origin": "TOPLEFT" }, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.53, "r_x1": 545.12, "r_y1": 258.53, "r_x2": 545.12, "r_y2": 249.62, "r_x3": 308.86, "r_y3": 249.62, "coord_origin": "TOPLEFT" }, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.48, "r_x1": 545.12, "r_y1": 270.48, "r_x2": 545.12, "r_y2": 261.58, "r_x3": 308.86, "r_y3": 261.58, "coord_origin": "TOPLEFT" }, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.44, "r_x1": 545.12, "r_y1": 282.44, "r_x2": 545.12, "r_y2": 273.53, "r_x3": 308.86, "r_y3": 273.53, "coord_origin": "TOPLEFT" }, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.39, "r_x1": 436.82, "r_y1": 294.39, "r_x2": 436.82, "r_y2": 285.49, "r_x3": 308.86, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 306.68, "r_x1": 542.74, "r_y1": 306.68, "r_x2": 542.74, "r_y2": 297.77, "r_x3": 320.82, "r_y3": 297.77, "coord_origin": "TOPLEFT" }, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 331.93, "r_x1": 316.28, "r_y1": 331.93, "r_x2": 316.28, "r_y2": 321.18, "r_x3": 308.86, "r_y3": 321.18, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.18, "r_y0": 331.93, "r_x1": 444.94, "r_y1": 331.93, "r_x2": 444.94, "r_y2": 321.18, "r_x3": 326.18, "r_y3": 321.18, "coord_origin": "TOPLEFT" }, "text": "The TableFormer model", "orig": "The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 350.85, "r_x1": 545.11, "r_y1": 350.85, "r_x2": 545.11, "r_y2": 341.94, "r_x3": 320.82, "r_y3": 341.94, "coord_origin": "TOPLEFT" }, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 362.8, "r_x1": 545.12, "r_y1": 362.8, "r_x2": 545.12, "r_y2": 353.89, "r_x3": 308.86, "r_y3": 353.89, "coord_origin": "TOPLEFT" }, "text": "dict: 1) a sequence of tokens that represent the structure of", "orig": "dict: 1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 374.76, "r_x1": 545.12, "r_y1": 374.76, "r_x2": 545.12, "r_y2": 365.85, "r_x3": 308.86, "r_y3": 365.85, "coord_origin": "TOPLEFT" }, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 386.71, "r_x1": 545.12, "r_y1": 386.71, "r_x2": 545.12, "r_y2": 377.8, "r_x3": 308.86, "r_y3": 377.8, "coord_origin": "TOPLEFT" }, "text": "tokens. The conversion of an image into a sequence of to-", "orig": "tokens. The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 398.67, "r_x1": 545.12, "r_y1": 398.67, "r_x2": 545.12, "r_y2": 389.76, "r_x3": 308.86, "r_y3": 389.76, "coord_origin": "TOPLEFT" }, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 410.62, "r_x1": 545.12, "r_y1": 410.62, "r_x2": 545.12, "r_y2": 401.71, "r_x3": 308.86, "r_y3": 401.71, "coord_origin": "TOPLEFT" }, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 422.58, "r_x1": 545.12, "r_y1": 422.58, "r_x2": 545.12, "r_y2": 413.67, "r_x3": 308.86, "r_y3": 413.67, "coord_origin": "TOPLEFT" }, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 434.53, "r_x1": 545.12, "r_y1": 434.53, "r_x2": 545.12, "r_y2": 425.63, "r_x3": 308.86, "r_y3": 425.63, "coord_origin": "TOPLEFT" }, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 446.49, "r_x1": 437.94, "r_y1": 446.49, "r_x2": 437.94, "r_y2": 437.58, "r_x3": 308.86, "r_y3": 437.58, "coord_origin": "TOPLEFT" }, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 467.55, "r_x1": 323.14, "r_y1": 467.55, "r_x2": 323.14, "r_y2": 457.69, "r_x3": 308.86, "r_y3": 457.69, "coord_origin": "TOPLEFT" }, "text": "4.1.", "orig": "4.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.66, "r_y0": 467.55, "r_x1": 420.16, "r_y1": 467.55, "r_x2": 420.16, "r_y2": 457.69, "r_x3": 332.66, "r_y3": 457.69, "coord_origin": "TOPLEFT" }, "text": "Model architecture.", "orig": "Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 485.67, "r_x1": 545.11, "r_y1": 485.67, "r_x2": 545.11, "r_y2": 476.77, "r_x3": 320.82, "r_y3": 476.77, "coord_origin": "TOPLEFT" }, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.63, "r_x1": 509.02, "r_y1": 497.63, "r_x2": 509.02, "r_y2": 488.72, "r_x3": 308.86, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "is composed of three main components, see Fig.", "orig": "is composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.59, "r_y0": 497.63, "r_x1": 523.06, "r_y1": 497.63, "r_x2": 523.06, "r_y2": 488.72, "r_x3": 515.59, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 497.63, "r_x1": 545.12, "r_y1": 497.63, "r_x2": 545.12, "r_y2": 488.72, "r_x3": 529.62, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.35, "r_x1": 406.35, "r_y1": 509.35, "r_x2": 406.35, "r_y2": 500.76, "r_x3": 308.86, "r_y3": 500.76, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.87, "r_y0": 509.58, "r_x1": 545.11, "r_y1": 509.58, "r_x2": 545.11, "r_y2": 500.68, "r_x3": 408.87, "r_y3": 500.68, "coord_origin": "TOPLEFT" }, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.54, "r_x1": 409.39, "r_y1": 521.54, "r_x2": 409.39, "r_y2": 512.63, "r_x3": 308.86, "r_y3": 512.63, "coord_origin": "TOPLEFT" }, "text": "tor of predefined length.", "orig": "tor of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 416.73, "r_y0": 521.54, "r_x1": 545.12, "r_y1": 521.54, "r_x2": 545.12, "r_y2": 512.63, "r_x3": 416.73, "r_y3": 512.63, "coord_origin": "TOPLEFT" }, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.49, "r_x1": 436.19, "r_y1": 533.49, "r_x2": 436.19, "r_y2": 524.59, "r_x3": 308.86, "r_y3": 524.59, "coord_origin": "TOPLEFT" }, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 533.26, "r_x1": 513.87, "r_y1": 533.26, "r_x2": 513.87, "r_y2": 524.68, "r_x3": 439.53, "r_y3": 524.68, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 517.43, "r_y0": 533.49, "r_x1": 545.11, "r_y1": 533.49, "r_x2": 545.11, "r_y2": 524.59, "r_x3": 517.43, "r_y3": 524.59, "coord_origin": "TOPLEFT" }, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.45, "r_x1": 545.12, "r_y1": 545.45, "r_x2": 545.12, "r_y2": 536.54, "r_x3": 308.86, "r_y3": 536.54, "coord_origin": "TOPLEFT" }, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.4, "r_x1": 358.55, "r_y1": 557.4, "r_x2": 358.55, "r_y2": 548.5, "r_x3": 308.86, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.19, "r_y0": 557.4, "r_x1": 545.12, "r_y1": 557.4, "r_x2": 545.12, "r_y2": 548.5, "r_x3": 365.19, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.36, "r_x1": 352.41, "r_y1": 569.36, "r_x2": 352.41, "r_y2": 560.45, "r_x3": 308.86, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "data cell (\u2018", "orig": "data cell (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.41, "r_y0": 569.14, "r_x1": 360.16, "r_y1": 569.14, "r_x2": 360.16, "r_y2": 560.29, "r_x3": 352.41, "r_y3": 560.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.16, "r_y0": 569.36, "r_x1": 367.91, "r_y1": 569.36, "r_x2": 367.91, "r_y2": 560.45, "r_x3": 360.16, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.91, "r_y0": 569.14, "r_x1": 375.66, "r_y1": 569.14, "r_x2": 375.66, "r_y2": 560.29, "r_x3": 367.91, "r_y3": 560.29, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.66, "r_y0": 569.36, "r_x1": 545.11, "r_y1": 569.36, "r_x2": 545.11, "r_y2": 560.45, "r_x3": 375.66, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "\u2019) the hidden state of that cell is passed to", "orig": "\u2019) the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.31, "r_x1": 545.11, "r_y1": 581.31, "r_x2": 545.11, "r_y2": 572.41, "r_x3": 308.86, "r_y3": 572.41, "coord_origin": "TOPLEFT" }, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.27, "r_x1": 483.12, "r_y1": 593.27, "r_x2": 483.12, "r_y2": 584.36, "r_x3": 308.86, "r_y3": 584.36, "coord_origin": "TOPLEFT" }, "text": "or column span, the tag is broken down to \u2018", "orig": "or column span, the tag is broken down to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.12, "r_y0": 593.05, "r_x1": 490.87, "r_y1": 593.05, "r_x2": 490.87, "r_y2": 584.2, "r_x3": 483.12, "r_y3": 584.2, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.87, "r_y0": 593.27, "r_x1": 545.11, "r_y1": 593.27, "r_x2": 545.11, "r_y2": 584.36, "r_x3": 490.87, "r_y3": 584.36, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018rowspan=\u2019", "orig": "\u2019, \u2018rowspan=\u2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.22, "r_x1": 545.11, "r_y1": 605.22, "r_x2": 545.11, "r_y2": 596.32, "r_x3": 308.86, "r_y3": 596.32, "coord_origin": "TOPLEFT" }, "text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.18, "r_x1": 329.64, "r_y1": 617.18, "r_x2": 329.64, "r_y2": 608.27, "r_x3": 308.86, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "and \u2018", "orig": "and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.65, "r_y0": 616.96, "r_x1": 337.39, "r_y1": 616.96, "r_x2": 337.39, "r_y2": 608.11, "r_x3": 329.65, "r_y3": 608.11, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.39, "r_y0": 617.18, "r_x1": 468.59, "r_y1": 617.18, "r_x2": 468.59, "r_y2": 608.27, "r_x3": 337.39, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "\u2019. The hidden state attached to \u2018", "orig": "\u2019. The hidden state attached to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.59, "r_y0": 616.96, "r_x1": 476.34, "r_y1": 616.96, "r_x2": 476.34, "r_y2": 608.11, "r_x3": 468.59, "r_y3": 608.11, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.34, "r_y0": 617.18, "r_x1": 545.12, "r_y1": 617.18, "r_x2": 545.12, "r_y2": 608.27, "r_x3": 476.34, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "\u2019 is passed to the", "orig": "\u2019 is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.13, "r_x1": 545.11, "r_y1": 629.13, "r_x2": 545.11, "r_y2": 620.23, "r_x3": 308.86, "r_y3": 620.23, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.09, "r_x1": 545.12, "r_y1": 641.09, "r_x2": 545.12, "r_y2": 632.18, "r_x3": 308.86, "r_y3": 632.18, "coord_origin": "TOPLEFT" }, "text": "receives the hidden states from the Structure Decoder, to", "orig": "receives the hidden states from the Structure Decoder, to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.04, "r_x1": 545.12, "r_y1": 653.04, "r_x2": 545.12, "r_y2": 644.14, "r_x3": 308.86, "r_y3": 644.14, "coord_origin": "TOPLEFT" }, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.0, "r_x1": 449.42, "r_y1": 665.0, "r_x2": 449.42, "r_y2": 656.09, "r_x3": 308.86, "r_y3": 656.09, "coord_origin": "TOPLEFT" }, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 677.22, "r_x1": 431.91, "r_y1": 677.22, "r_x2": 431.91, "r_y2": 668.26, "r_x3": 320.82, "r_y3": 668.26, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 439.5, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.11, "r_y1": 689.24, "r_x2": 545.11, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 96.07, "coord_origin": "TOPLEFT" }, "confidence": 0.961, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 212.28, "r_y1": 96.07, "r_x2": 212.28, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 100.96, "r": 286.37, "b": 313.11, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 109.87, "r_x1": 286.37, "r_y1": 109.87, "r_x2": 286.37, "r_y2": 100.96, "r_x3": 62.07, "r_y3": 100.96, "coord_origin": "TOPLEFT" }, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 121.82, "r_x1": 286.37, "r_y1": 121.82, "r_x2": 286.37, "r_y2": 112.92, "r_x3": 50.11, "r_y3": 112.92, "coord_origin": "TOPLEFT" }, "text": "is essential to train our models. In order to distinguish be-", "orig": "is essential to train our models. In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 133.78, "r_x1": 286.37, "r_y1": 133.78, "r_x2": 286.37, "r_y2": 124.87, "r_x3": 50.11, "r_y3": 124.87, "coord_origin": "TOPLEFT" }, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 145.73, "r_x1": 286.37, "r_y1": 145.73, "r_x2": 286.37, "r_y2": 136.83, "r_x3": 50.11, "r_y3": 136.83, "coord_origin": "TOPLEFT" }, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 157.69, "r_x1": 286.37, "r_y1": 157.69, "r_x2": 286.37, "r_y2": 148.78, "r_x3": 50.11, "r_y3": 148.78, "coord_origin": "TOPLEFT" }, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 169.64, "r_x1": 286.37, "r_y1": 169.64, "r_x2": 286.37, "r_y2": 160.74, "r_x3": 50.11, "r_y3": 160.74, "coord_origin": "TOPLEFT" }, "text": "tables (e.g. TableBank) or they narrow their scope only to", "orig": "tables (e.g. TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 181.6, "r_x1": 286.37, "r_y1": 181.6, "r_x2": 286.37, "r_y2": 172.69, "r_x3": 50.11, "r_y3": 172.69, "coord_origin": "TOPLEFT" }, "text": "non-empty cells. Therefore, it was imperative to introduce", "orig": "non-empty cells. Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 193.55, "r_x1": 286.37, "r_y1": 193.55, "r_x2": 286.37, "r_y2": 184.65, "r_x3": 50.11, "r_y3": 184.65, "coord_origin": "TOPLEFT" }, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 205.51, "r_x1": 286.37, "r_y1": 205.51, "r_x2": 286.37, "r_y2": 196.6, "r_x3": 50.11, "r_y3": 196.6, "coord_origin": "TOPLEFT" }, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 217.46, "r_x1": 286.37, "r_y1": 217.46, "r_x2": 286.37, "r_y2": 208.56, "r_x3": 50.11, "r_y3": 208.56, "coord_origin": "TOPLEFT" }, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 229.42, "r_x1": 286.37, "r_y1": 229.42, "r_x2": 286.37, "r_y2": 220.51, "r_x3": 50.11, "r_y3": 220.51, "coord_origin": "TOPLEFT" }, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 241.37, "r_x1": 286.37, "r_y1": 241.37, "r_x2": 286.37, "r_y2": 232.47, "r_x3": 50.11, "r_y3": 232.47, "coord_origin": "TOPLEFT" }, "text": "ers the table structure. Notice that each table cell may oc-", "orig": "ers the table structure. Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 253.33, "r_x1": 286.37, "r_y1": 253.33, "r_x2": 286.37, "r_y2": 244.42, "r_x3": 50.11, "r_y3": 244.42, "coord_origin": "TOPLEFT" }, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 265.28, "r_x1": 286.37, "r_y1": 265.28, "r_x2": 286.37, "r_y2": 256.38, "r_x3": 50.11, "r_y3": 256.38, "coord_origin": "TOPLEFT" }, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 277.24, "r_x1": 286.37, "r_y1": 277.24, "r_x2": 286.37, "r_y2": 268.33, "r_x3": 50.11, "r_y3": 268.33, "coord_origin": "TOPLEFT" }, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 289.2, "r_x1": 68.65, "r_y1": 289.2, "r_x2": 68.65, "r_y2": 280.29, "r_x3": 50.11, "r_y3": 280.29, "coord_origin": "TOPLEFT" }, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.57, "r_y0": 289.2, "r_x1": 286.37, "r_y1": 289.2, "r_x2": 286.37, "r_y2": 280.29, "r_x3": 75.57, "r_y3": 280.29, "coord_origin": "TOPLEFT" }, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 301.15, "r_x1": 286.37, "r_y1": 301.15, "r_x2": 286.37, "r_y2": 292.24, "r_x3": 50.11, "r_y3": 292.24, "coord_origin": "TOPLEFT" }, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 313.11, "r_x1": 75.7, "r_y1": 313.11, "r_x2": 75.7, "r_y2": 304.2, "r_x3": 50.11, "r_y3": 304.2, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 318.0, "r": 286.37, "b": 434.5, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 326.9, "r_x1": 286.36, "r_y1": 326.9, "r_x2": 286.36, "r_y2": 318.0, "r_x3": 62.07, "r_y3": 318.0, "coord_origin": "TOPLEFT" }, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 338.86, "r_x1": 286.37, "r_y1": 338.86, "r_x2": 286.37, "r_y2": 329.95, "r_x3": 50.11, "r_y3": 329.95, "coord_origin": "TOPLEFT" }, "text": "all datasets are skewed towards simpler structures with", "orig": "all datasets are skewed towards simpler structures with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 350.81, "r_x1": 286.37, "r_y1": 350.81, "r_x2": 286.37, "r_y2": 341.91, "r_x3": 50.11, "r_y3": 341.91, "coord_origin": "TOPLEFT" }, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 362.77, "r_x1": 286.37, "r_y1": 362.77, "r_x2": 286.37, "r_y2": 353.86, "r_x3": 50.11, "r_y3": 353.86, "coord_origin": "TOPLEFT" }, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 374.72, "r_x1": 286.37, "r_y1": 374.72, "r_x2": 286.37, "r_y2": 365.82, "r_x3": 50.11, "r_y3": 365.82, "coord_origin": "TOPLEFT" }, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 386.68, "r_x1": 141.59, "r_y1": 386.68, "r_x2": 141.59, "r_y2": 377.77, "r_x3": 50.11, "r_y3": 377.77, "coord_origin": "TOPLEFT" }, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.7, "r_y0": 386.68, "r_x1": 286.37, "r_y1": 386.68, "r_x2": 286.37, "r_y2": 377.77, "r_x3": 148.7, "r_y3": 377.77, "coord_origin": "TOPLEFT" }, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 398.63, "r_x1": 286.37, "r_y1": 398.63, "r_x2": 286.37, "r_y2": 389.73, "r_x3": 50.11, "r_y3": 389.73, "coord_origin": "TOPLEFT" }, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 410.59, "r_x1": 286.37, "r_y1": 410.59, "r_x2": 286.37, "r_y2": 401.68, "r_x3": 50.11, "r_y3": 401.68, "coord_origin": "TOPLEFT" }, "text": "Net) is restricted to a certain domain. Ultimately, the lack", "orig": "Net) is restricted to a certain domain. Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 422.54, "r_x1": 286.37, "r_y1": 422.54, "r_x2": 286.37, "r_y2": 413.64, "r_x3": 50.11, "r_y3": 413.64, "coord_origin": "TOPLEFT" }, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 434.5, "r_x1": 216.4, "r_y1": 434.5, "r_x2": 216.4, "r_y2": 425.59, "r_x3": 50.11, "r_y3": 425.59, "coord_origin": "TOPLEFT" }, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 439.39, "r": 286.37, "b": 627.62, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 448.3, "r_x1": 286.36, "r_y1": 448.3, "r_x2": 286.36, "r_y2": 439.39, "r_x3": 62.07, "r_y3": 439.39, "coord_origin": "TOPLEFT" }, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 460.25, "r_x1": 172.14, "r_y1": 460.25, "r_x2": 172.14, "r_y2": 451.34, "r_x3": 50.11, "r_y3": 451.34, "coord_origin": "TOPLEFT" }, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.15, "r_y0": 460.02, "r_x1": 224.71, "r_y1": 460.02, "r_x2": 224.71, "r_y2": 451.43, "r_x3": 174.15, "r_y3": 451.43, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.71, "r_y0": 460.25, "r_x1": 286.37, "r_y1": 460.25, "r_x2": 286.37, "r_y2": 451.34, "r_x3": 224.71, "r_y3": 451.34, "coord_origin": "TOPLEFT" }, "text": ". This approach", "orig": ". This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 472.21, "r_x1": 286.37, "r_y1": 472.21, "r_x2": 286.37, "r_y2": 463.3, "r_x3": 50.11, "r_y3": 463.3, "coord_origin": "TOPLEFT" }, "text": "offers control over: 1) the size of the dataset, 2) the table", "orig": "offers control over: 1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 484.16, "r_x1": 286.37, "r_y1": 484.16, "r_x2": 286.37, "r_y2": 475.26, "r_x3": 50.11, "r_y3": 475.26, "coord_origin": "TOPLEFT" }, "text": "structure, 3) the table style and 4) the type of content. The", "orig": "structure, 3) the table style and 4) the type of content. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 496.12, "r_x1": 286.37, "r_y1": 496.12, "r_x2": 286.37, "r_y2": 487.21, "r_x3": 50.11, "r_y3": 487.21, "coord_origin": "TOPLEFT" }, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 508.07, "r_x1": 286.37, "r_y1": 508.07, "r_x2": 286.37, "r_y2": 499.17, "r_x3": 50.11, "r_y3": 499.17, "coord_origin": "TOPLEFT" }, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 520.03, "r_x1": 286.37, "r_y1": 520.03, "r_x2": 286.37, "r_y2": 511.12, "r_x3": 50.11, "r_y3": 511.12, "coord_origin": "TOPLEFT" }, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 531.98, "r_x1": 286.37, "r_y1": 531.98, "r_x2": 286.37, "r_y2": 523.08, "r_x3": 50.11, "r_y3": 523.08, "coord_origin": "TOPLEFT" }, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 543.94, "r_x1": 286.37, "r_y1": 543.94, "r_x2": 286.37, "r_y2": 535.03, "r_x3": 50.11, "r_y3": 535.03, "coord_origin": "TOPLEFT" }, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 555.89, "r_x1": 286.37, "r_y1": 555.89, "r_x2": 286.37, "r_y2": 546.99, "r_x3": 50.11, "r_y3": 546.99, "coord_origin": "TOPLEFT" }, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 567.85, "r_x1": 286.37, "r_y1": 567.85, "r_x2": 286.37, "r_y2": 558.94, "r_x3": 50.11, "r_y3": 558.94, "coord_origin": "TOPLEFT" }, "text": "corpora. By controlling the size and scope of the synthetic", "orig": "corpora. By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 579.8, "r_x1": 286.37, "r_y1": 579.8, "r_x2": 286.37, "r_y2": 570.9, "r_x3": 50.11, "r_y3": 570.9, "coord_origin": "TOPLEFT" }, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 591.76, "r_x1": 286.37, "r_y1": 591.76, "r_x2": 286.37, "r_y2": 582.85, "r_x3": 50.11, "r_y3": 582.85, "coord_origin": "TOPLEFT" }, "text": "variety of different conditions. For example, we can first", "orig": "variety of different conditions. For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 603.71, "r_x1": 286.37, "r_y1": 603.71, "r_x2": 286.37, "r_y2": 594.81, "r_x3": 50.11, "r_y3": 594.81, "coord_origin": "TOPLEFT" }, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 615.67, "r_x1": 286.37, "r_y1": 615.67, "r_x2": 286.37, "r_y2": 606.76, "r_x3": 50.11, "r_y3": 606.76, "coord_origin": "TOPLEFT" }, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 627.62, "r_x1": 209.75, "r_y1": 627.62, "r_x2": 209.75, "r_y2": 618.72, "r_x3": 50.11, "r_y3": 618.72, "coord_origin": "TOPLEFT" }, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 632.51, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 641.42, "r_x1": 286.36, "r_y1": 641.42, "r_x2": 286.36, "r_y2": 632.51, "r_x3": 62.07, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.43, "r_x3": 50.11, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "generated text. The first two synthetic datasets have been", "orig": "generated text. The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 310.68, "t": 73.19, "r": 542.95, "b": 155.22, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 17, "label": "text", "bbox": { "l": 412.33, "t": 73.61, "r": 430.9, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 442.86, "t": 73.61, "r": 464.45, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 477.79, "t": 73.61, "r": 494.94, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 508.28, "t": 73.61, "r": 536.91, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 317.06, "t": 85.97, "r": 361.64, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 417.86, "t": 85.67, "r": 425.38, "b": 94.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 449.9, "t": 85.67, "r": 457.42, "b": 94.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 476.4, "t": 85.97, "r": 496.33, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 512.63, "t": 85.97, "r": 532.56, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 317.06, "t": 97.92, "r": 359.43, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 417.86, "t": 97.62, "r": 425.38, "b": 106.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 449.9, "t": 97.62, "r": 457.42, "b": 106.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 476.4, "t": 97.92, "r": 496.33, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 513.46, "t": 97.92, "r": 531.73, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 317.06, "t": 109.88, "r": 359.98, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 417.86, "t": 109.58, "r": 425.38, "b": 118.79, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 450.81, "t": 109.58, "r": 456.5, "b": 118.79, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 476.4, "t": 109.88, "r": 496.33, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 511.25, "t": 109.88, "r": 533.95, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 317.06, "t": 121.83, "r": 400.38, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 417.86, "t": 121.53, "r": 425.38, "b": 130.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 449.9, "t": 121.53, "r": 457.42, "b": 130.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 476.4, "t": 121.83, "r": 496.33, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 512.63, "t": 121.83, "r": 532.56, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 317.06, "t": 133.79, "r": 375.17, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 417.86, "t": 133.49, "r": 425.38, "b": 142.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 449.9, "t": 133.49, "r": 457.42, "b": 142.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 476.4, "t": 133.79, "r": 496.33, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 512.63, "t": 133.79, "r": 532.56, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 317.06, "t": 145.74, "r": 369.39, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 417.86, "t": 145.44, "r": 425.38, "b": 154.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 449.9, "t": 145.44, "r": 457.42, "b": 154.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 476.4, "t": 145.74, "r": 496.33, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 512.63, "t": 145.74, "r": 532.56, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 9, "label": "caption", "bbox": { "l": 308.86, "t": 167.66, "r": 545.12, "b": 224.39, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 176.57, "r_x1": 344.62, "r_y1": 176.57, "r_x2": 344.62, "r_y2": 167.66, "r_x3": 308.86, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "Table 1:", "orig": "Table 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.08, "r_y0": 176.57, "r_x1": 380.45, "r_y1": 176.57, "r_x2": 380.45, "r_y2": 167.66, "r_x3": 361.08, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.57, "r_y0": 176.34, "r_x1": 468.68, "r_y1": 176.34, "r_x2": 468.68, "r_y2": 167.75, "r_x3": 386.57, "r_y3": 167.75, "coord_origin": "TOPLEFT" }, "text": "\u201cCombined-Tabnet\u201d", "orig": "\u201cCombined-Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.8, "r_y0": 176.57, "r_x1": 489.18, "r_y1": 176.57, "r_x2": 489.18, "r_y2": 167.66, "r_x3": 474.8, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.3, "r_y0": 176.34, "r_x1": 545.11, "r_y1": 176.34, "r_x2": 545.11, "r_y2": 167.75, "r_x3": 495.3, "r_y3": 167.75, "coord_origin": "TOPLEFT" }, "text": "\u201dCombined-", "orig": "\u201dCombined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 188.29, "r_x1": 341.16, "r_y1": 188.29, "r_x2": 341.16, "r_y2": 179.71, "r_x3": 308.86, "r_y3": 179.71, "coord_origin": "TOPLEFT" }, "text": "Tabnet\u201d", "orig": "Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.46, "r_y0": 188.52, "r_x1": 545.11, "r_y1": 188.52, "r_x2": 545.11, "r_y2": 179.62, "r_x3": 343.46, "r_y3": 179.62, "coord_origin": "TOPLEFT" }, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 200.48, "r_x1": 545.12, "r_y1": 200.48, "r_x2": 545.12, "r_y2": 191.57, "r_x3": 308.86, "r_y3": 191.57, "coord_origin": "TOPLEFT" }, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 212.43, "r_x1": 545.11, "r_y1": 212.43, "r_x2": 545.11, "r_y2": 203.53, "r_x3": 308.86, "r_y3": 203.53, "coord_origin": "TOPLEFT" }, "text": "and Fintabnet. (**) The combined dataset is the processed", "orig": "and Fintabnet. (**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 224.39, "r_x1": 523.93, "r_y1": 224.39, "r_x2": 523.93, "r_y2": 215.48, "r_x3": 308.86, "r_y3": 215.48, "coord_origin": "TOPLEFT" }, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 308.86, "t": 249.62, "r": 545.12, "b": 294.39, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.53, "r_x1": 545.12, "r_y1": 258.53, "r_x2": 545.12, "r_y2": 249.62, "r_x3": 308.86, "r_y3": 249.62, "coord_origin": "TOPLEFT" }, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.48, "r_x1": 545.12, "r_y1": 270.48, "r_x2": 545.12, "r_y2": 261.58, "r_x3": 308.86, "r_y3": 261.58, "coord_origin": "TOPLEFT" }, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.44, "r_x1": 545.12, "r_y1": 282.44, "r_x2": 545.12, "r_y2": 273.53, "r_x3": 308.86, "r_y3": 273.53, "coord_origin": "TOPLEFT" }, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.39, "r_x1": 436.82, "r_y1": 294.39, "r_x2": 436.82, "r_y2": 285.49, "r_x3": 308.86, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 320.82, "t": 297.77, "r": 542.74, "b": 306.68, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 306.68, "r_x1": 542.74, "r_y1": 306.68, "r_x2": 542.74, "r_y2": 297.77, "r_x3": 320.82, "r_y3": 297.77, "coord_origin": "TOPLEFT" }, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "section_header", "bbox": { "l": 308.86, "t": 321.18, "r": 444.94, "b": 331.93, "coord_origin": "TOPLEFT" }, "confidence": 0.947, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 331.93, "r_x1": 316.28, "r_y1": 331.93, "r_x2": 316.28, "r_y2": 321.18, "r_x3": 308.86, "r_y3": 321.18, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.18, "r_y0": 331.93, "r_x1": 444.94, "r_y1": 331.93, "r_x2": 444.94, "r_y2": 321.18, "r_x3": 326.18, "r_y3": 321.18, "coord_origin": "TOPLEFT" }, "text": "The TableFormer model", "orig": "The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 341.94, "r": 545.12, "b": 446.49, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 350.85, "r_x1": 545.11, "r_y1": 350.85, "r_x2": 545.11, "r_y2": 341.94, "r_x3": 320.82, "r_y3": 341.94, "coord_origin": "TOPLEFT" }, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 362.8, "r_x1": 545.12, "r_y1": 362.8, "r_x2": 545.12, "r_y2": 353.89, "r_x3": 308.86, "r_y3": 353.89, "coord_origin": "TOPLEFT" }, "text": "dict: 1) a sequence of tokens that represent the structure of", "orig": "dict: 1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 374.76, "r_x1": 545.12, "r_y1": 374.76, "r_x2": 545.12, "r_y2": 365.85, "r_x3": 308.86, "r_y3": 365.85, "coord_origin": "TOPLEFT" }, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 386.71, "r_x1": 545.12, "r_y1": 386.71, "r_x2": 545.12, "r_y2": 377.8, "r_x3": 308.86, "r_y3": 377.8, "coord_origin": "TOPLEFT" }, "text": "tokens. The conversion of an image into a sequence of to-", "orig": "tokens. The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 398.67, "r_x1": 545.12, "r_y1": 398.67, "r_x2": 545.12, "r_y2": 389.76, "r_x3": 308.86, "r_y3": 389.76, "coord_origin": "TOPLEFT" }, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 410.62, "r_x1": 545.12, "r_y1": 410.62, "r_x2": 545.12, "r_y2": 401.71, "r_x3": 308.86, "r_y3": 401.71, "coord_origin": "TOPLEFT" }, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 422.58, "r_x1": 545.12, "r_y1": 422.58, "r_x2": 545.12, "r_y2": 413.67, "r_x3": 308.86, "r_y3": 413.67, "coord_origin": "TOPLEFT" }, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 434.53, "r_x1": 545.12, "r_y1": 434.53, "r_x2": 545.12, "r_y2": 425.63, "r_x3": 308.86, "r_y3": 425.63, "coord_origin": "TOPLEFT" }, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 446.49, "r_x1": 437.94, "r_y1": 446.49, "r_x2": 437.94, "r_y2": 437.58, "r_x3": 308.86, "r_y3": 437.58, "coord_origin": "TOPLEFT" }, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "section_header", "bbox": { "l": 308.86, "t": 457.69, "r": 420.16, "b": 467.55, "coord_origin": "TOPLEFT" }, "confidence": 0.938, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 467.55, "r_x1": 323.14, "r_y1": 467.55, "r_x2": 323.14, "r_y2": 457.69, "r_x3": 308.86, "r_y3": 457.69, "coord_origin": "TOPLEFT" }, "text": "4.1.", "orig": "4.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.66, "r_y0": 467.55, "r_x1": 420.16, "r_y1": 467.55, "r_x2": 420.16, "r_y2": 457.69, "r_x3": 332.66, "r_y3": 457.69, "coord_origin": "TOPLEFT" }, "text": "Model architecture.", "orig": "Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 476.77, "r": 545.12, "b": 665.0, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 485.67, "r_x1": 545.11, "r_y1": 485.67, "r_x2": 545.11, "r_y2": 476.77, "r_x3": 320.82, "r_y3": 476.77, "coord_origin": "TOPLEFT" }, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.63, "r_x1": 509.02, "r_y1": 497.63, "r_x2": 509.02, "r_y2": 488.72, "r_x3": 308.86, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "is composed of three main components, see Fig.", "orig": "is composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.59, "r_y0": 497.63, "r_x1": 523.06, "r_y1": 497.63, "r_x2": 523.06, "r_y2": 488.72, "r_x3": 515.59, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 497.63, "r_x1": 545.12, "r_y1": 497.63, "r_x2": 545.12, "r_y2": 488.72, "r_x3": 529.62, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.35, "r_x1": 406.35, "r_y1": 509.35, "r_x2": 406.35, "r_y2": 500.76, "r_x3": 308.86, "r_y3": 500.76, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.87, "r_y0": 509.58, "r_x1": 545.11, "r_y1": 509.58, "r_x2": 545.11, "r_y2": 500.68, "r_x3": 408.87, "r_y3": 500.68, "coord_origin": "TOPLEFT" }, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.54, "r_x1": 409.39, "r_y1": 521.54, "r_x2": 409.39, "r_y2": 512.63, "r_x3": 308.86, "r_y3": 512.63, "coord_origin": "TOPLEFT" }, "text": "tor of predefined length.", "orig": "tor of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 416.73, "r_y0": 521.54, "r_x1": 545.12, "r_y1": 521.54, "r_x2": 545.12, "r_y2": 512.63, "r_x3": 416.73, "r_y3": 512.63, "coord_origin": "TOPLEFT" }, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.49, "r_x1": 436.19, "r_y1": 533.49, "r_x2": 436.19, "r_y2": 524.59, "r_x3": 308.86, "r_y3": 524.59, "coord_origin": "TOPLEFT" }, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 533.26, "r_x1": 513.87, "r_y1": 533.26, "r_x2": 513.87, "r_y2": 524.68, "r_x3": 439.53, "r_y3": 524.68, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 517.43, "r_y0": 533.49, "r_x1": 545.11, "r_y1": 533.49, "r_x2": 545.11, "r_y2": 524.59, "r_x3": 517.43, "r_y3": 524.59, "coord_origin": "TOPLEFT" }, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.45, "r_x1": 545.12, "r_y1": 545.45, "r_x2": 545.12, "r_y2": 536.54, "r_x3": 308.86, "r_y3": 536.54, "coord_origin": "TOPLEFT" }, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.4, "r_x1": 358.55, "r_y1": 557.4, "r_x2": 358.55, "r_y2": 548.5, "r_x3": 308.86, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.19, "r_y0": 557.4, "r_x1": 545.12, "r_y1": 557.4, "r_x2": 545.12, "r_y2": 548.5, "r_x3": 365.19, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.36, "r_x1": 352.41, "r_y1": 569.36, "r_x2": 352.41, "r_y2": 560.45, "r_x3": 308.86, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "data cell (\u2018", "orig": "data cell (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.41, "r_y0": 569.14, "r_x1": 360.16, "r_y1": 569.14, "r_x2": 360.16, "r_y2": 560.29, "r_x3": 352.41, "r_y3": 560.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.16, "r_y0": 569.36, "r_x1": 367.91, "r_y1": 569.36, "r_x2": 367.91, "r_y2": 560.45, "r_x3": 360.16, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.91, "r_y0": 569.14, "r_x1": 375.66, "r_y1": 569.14, "r_x2": 375.66, "r_y2": 560.29, "r_x3": 367.91, "r_y3": 560.29, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.66, "r_y0": 569.36, "r_x1": 545.11, "r_y1": 569.36, "r_x2": 545.11, "r_y2": 560.45, "r_x3": 375.66, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "\u2019) the hidden state of that cell is passed to", "orig": "\u2019) the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.31, "r_x1": 545.11, "r_y1": 581.31, "r_x2": 545.11, "r_y2": 572.41, "r_x3": 308.86, "r_y3": 572.41, "coord_origin": "TOPLEFT" }, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.27, "r_x1": 483.12, "r_y1": 593.27, "r_x2": 483.12, "r_y2": 584.36, "r_x3": 308.86, "r_y3": 584.36, "coord_origin": "TOPLEFT" }, "text": "or column span, the tag is broken down to \u2018", "orig": "or column span, the tag is broken down to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.12, "r_y0": 593.05, "r_x1": 490.87, "r_y1": 593.05, "r_x2": 490.87, "r_y2": 584.2, "r_x3": 483.12, "r_y3": 584.2, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.87, "r_y0": 593.27, "r_x1": 545.11, "r_y1": 593.27, "r_x2": 545.11, "r_y2": 584.36, "r_x3": 490.87, "r_y3": 584.36, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018rowspan=\u2019", "orig": "\u2019, \u2018rowspan=\u2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.22, "r_x1": 545.11, "r_y1": 605.22, "r_x2": 545.11, "r_y2": 596.32, "r_x3": 308.86, "r_y3": 596.32, "coord_origin": "TOPLEFT" }, "text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.18, "r_x1": 329.64, "r_y1": 617.18, "r_x2": 329.64, "r_y2": 608.27, "r_x3": 308.86, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "and \u2018", "orig": "and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.65, "r_y0": 616.96, "r_x1": 337.39, "r_y1": 616.96, "r_x2": 337.39, "r_y2": 608.11, "r_x3": 329.65, "r_y3": 608.11, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.39, "r_y0": 617.18, "r_x1": 468.59, "r_y1": 617.18, "r_x2": 468.59, "r_y2": 608.27, "r_x3": 337.39, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "\u2019. The hidden state attached to \u2018", "orig": "\u2019. The hidden state attached to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.59, "r_y0": 616.96, "r_x1": 476.34, "r_y1": 616.96, "r_x2": 476.34, "r_y2": 608.11, "r_x3": 468.59, "r_y3": 608.11, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.34, "r_y0": 617.18, "r_x1": 545.12, "r_y1": 617.18, "r_x2": 545.12, "r_y2": 608.27, "r_x3": 476.34, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "\u2019 is passed to the", "orig": "\u2019 is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.13, "r_x1": 545.11, "r_y1": 629.13, "r_x2": 545.11, "r_y2": 620.23, "r_x3": 308.86, "r_y3": 620.23, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.09, "r_x1": 545.12, "r_y1": 641.09, "r_x2": 545.12, "r_y2": 632.18, "r_x3": 308.86, "r_y3": 632.18, "coord_origin": "TOPLEFT" }, "text": "receives the hidden states from the Structure Decoder, to", "orig": "receives the hidden states from the Structure Decoder, to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.04, "r_x1": 545.12, "r_y1": 653.04, "r_x2": 545.12, "r_y2": 644.14, "r_x3": 308.86, "r_y3": 644.14, "coord_origin": "TOPLEFT" }, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.0, "r_x1": 449.42, "r_y1": 665.0, "r_x2": 449.42, "r_y2": 656.09, "r_x3": 308.86, "r_y3": 656.09, "coord_origin": "TOPLEFT" }, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 308.86, "t": 668.26, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 677.22, "r_x1": 431.91, "r_y1": 677.22, "r_x2": 431.91, "r_y2": 668.26, "r_x3": 320.82, "r_y3": 668.26, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 439.5, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.11, "r_y1": 689.24, "r_x2": 545.11, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "8": { "label": "table", "id": 8, "page_no": 3, "cluster": { "id": 8, "label": "table", "bbox": { "l": 310.68, "t": 73.19, "r": 542.95, "b": 155.22, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 17, "label": "text", "bbox": { "l": 412.33, "t": 73.61, "r": 430.9, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 442.86, "t": 73.61, "r": 464.45, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 477.79, "t": 73.61, "r": 494.94, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 508.28, "t": 73.61, "r": 536.91, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 317.06, "t": 85.97, "r": 361.64, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 417.86, "t": 85.67, "r": 425.38, "b": 94.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 449.9, "t": 85.67, "r": 457.42, "b": 94.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 476.4, "t": 85.97, "r": 496.33, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 512.63, "t": 85.97, "r": 532.56, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 317.06, "t": 97.92, "r": 359.43, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 417.86, "t": 97.62, "r": 425.38, "b": 106.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 449.9, "t": 97.62, "r": 457.42, "b": 106.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 476.4, "t": 97.92, "r": 496.33, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 513.46, "t": 97.92, "r": 531.73, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 317.06, "t": 109.88, "r": 359.98, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 417.86, "t": 109.58, "r": 425.38, "b": 118.79, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 450.81, "t": 109.58, "r": 456.5, "b": 118.79, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 476.4, "t": 109.88, "r": 496.33, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 511.25, "t": 109.88, "r": 533.95, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 317.06, "t": 121.83, "r": 400.38, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 417.86, "t": 121.53, "r": 425.38, "b": 130.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 449.9, "t": 121.53, "r": 457.42, "b": 130.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 476.4, "t": 121.83, "r": 496.33, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 512.63, "t": 121.83, "r": 532.56, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 317.06, "t": 133.79, "r": 375.17, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 417.86, "t": 133.49, "r": 425.38, "b": 142.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 449.9, "t": 133.49, "r": 457.42, "b": 142.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 476.4, "t": 133.79, "r": 496.33, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 512.63, "t": 133.79, "r": 532.56, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 317.06, "t": 145.74, "r": 369.39, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 417.86, "t": 145.44, "r": 425.38, "b": 154.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 449.9, "t": 145.44, "r": 457.42, "b": 154.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 476.4, "t": 145.74, "r": 496.33, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 512.63, "t": 145.74, "r": 532.56, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 412.33, "t": 73.61, "r": 430.9, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 442.86, "t": 73.61, "r": 464.45, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 477.79, "t": 73.61, "r": 494.94, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 508.28, "t": 73.61, "r": 536.91, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 85.97, "r": 361.64, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 85.67, "r": 425.38, "b": 94.88, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 85.67, "r": 457.42, "b": 94.88, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 85.97, "r": 496.33, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 85.97, "r": 532.56, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 97.92, "r": 359.43, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 97.62, "r": 425.38, "b": 106.84, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 97.62, "r": 457.42, "b": 106.84, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 97.92, "r": 496.33, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.46, "t": 97.92, "r": 531.73, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 109.88, "r": 359.98, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 109.58, "r": 425.38, "b": 118.79, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 450.81, "t": 109.58, "r": 456.5, "b": 118.79, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 109.88, "r": 496.33, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 511.25, "t": 109.88, "r": 533.95, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 121.83, "r": 400.38, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 121.53, "r": 425.38, "b": 130.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 121.53, "r": 457.42, "b": 130.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 121.83, "r": 496.33, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 121.83, "r": 532.56, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 133.79, "r": 375.17, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 133.49, "r": 425.38, "b": 142.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 133.49, "r": 457.42, "b": 142.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 133.79, "r": 496.33, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 133.79, "r": 532.56, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 145.74, "r": 369.39, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 145.44, "r": 425.38, "b": 154.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 145.44, "r": 457.42, "b": 154.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 145.74, "r": 496.33, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 145.74, "r": 532.56, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 10, "page_no": 3, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 96.07, "coord_origin": "TOPLEFT" }, "confidence": 0.961, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 212.28, "r_y1": 96.07, "r_x2": 212.28, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)." }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 100.96, "r": 286.37, "b": 313.11, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 109.87, "r_x1": 286.37, "r_y1": 109.87, "r_x2": 286.37, "r_y2": 100.96, "r_x3": 62.07, "r_y3": 100.96, "coord_origin": "TOPLEFT" }, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 121.82, "r_x1": 286.37, "r_y1": 121.82, "r_x2": 286.37, "r_y2": 112.92, "r_x3": 50.11, "r_y3": 112.92, "coord_origin": "TOPLEFT" }, "text": "is essential to train our models. In order to distinguish be-", "orig": "is essential to train our models. In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 133.78, "r_x1": 286.37, "r_y1": 133.78, "r_x2": 286.37, "r_y2": 124.87, "r_x3": 50.11, "r_y3": 124.87, "coord_origin": "TOPLEFT" }, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 145.73, "r_x1": 286.37, "r_y1": 145.73, "r_x2": 286.37, "r_y2": 136.83, "r_x3": 50.11, "r_y3": 136.83, "coord_origin": "TOPLEFT" }, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 157.69, "r_x1": 286.37, "r_y1": 157.69, "r_x2": 286.37, "r_y2": 148.78, "r_x3": 50.11, "r_y3": 148.78, "coord_origin": "TOPLEFT" }, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 169.64, "r_x1": 286.37, "r_y1": 169.64, "r_x2": 286.37, "r_y2": 160.74, "r_x3": 50.11, "r_y3": 160.74, "coord_origin": "TOPLEFT" }, "text": "tables (e.g. TableBank) or they narrow their scope only to", "orig": "tables (e.g. TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 181.6, "r_x1": 286.37, "r_y1": 181.6, "r_x2": 286.37, "r_y2": 172.69, "r_x3": 50.11, "r_y3": 172.69, "coord_origin": "TOPLEFT" }, "text": "non-empty cells. Therefore, it was imperative to introduce", "orig": "non-empty cells. Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 193.55, "r_x1": 286.37, "r_y1": 193.55, "r_x2": 286.37, "r_y2": 184.65, "r_x3": 50.11, "r_y3": 184.65, "coord_origin": "TOPLEFT" }, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 205.51, "r_x1": 286.37, "r_y1": 205.51, "r_x2": 286.37, "r_y2": 196.6, "r_x3": 50.11, "r_y3": 196.6, "coord_origin": "TOPLEFT" }, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 217.46, "r_x1": 286.37, "r_y1": 217.46, "r_x2": 286.37, "r_y2": 208.56, "r_x3": 50.11, "r_y3": 208.56, "coord_origin": "TOPLEFT" }, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 229.42, "r_x1": 286.37, "r_y1": 229.42, "r_x2": 286.37, "r_y2": 220.51, "r_x3": 50.11, "r_y3": 220.51, "coord_origin": "TOPLEFT" }, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 241.37, "r_x1": 286.37, "r_y1": 241.37, "r_x2": 286.37, "r_y2": 232.47, "r_x3": 50.11, "r_y3": 232.47, "coord_origin": "TOPLEFT" }, "text": "ers the table structure. Notice that each table cell may oc-", "orig": "ers the table structure. Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 253.33, "r_x1": 286.37, "r_y1": 253.33, "r_x2": 286.37, "r_y2": 244.42, "r_x3": 50.11, "r_y3": 244.42, "coord_origin": "TOPLEFT" }, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 265.28, "r_x1": 286.37, "r_y1": 265.28, "r_x2": 286.37, "r_y2": 256.38, "r_x3": 50.11, "r_y3": 256.38, "coord_origin": "TOPLEFT" }, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 277.24, "r_x1": 286.37, "r_y1": 277.24, "r_x2": 286.37, "r_y2": 268.33, "r_x3": 50.11, "r_y3": 268.33, "coord_origin": "TOPLEFT" }, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 289.2, "r_x1": 68.65, "r_y1": 289.2, "r_x2": 68.65, "r_y2": 280.29, "r_x3": 50.11, "r_y3": 280.29, "coord_origin": "TOPLEFT" }, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.57, "r_y0": 289.2, "r_x1": 286.37, "r_y1": 289.2, "r_x2": 286.37, "r_y2": 280.29, "r_x3": 75.57, "r_y3": 280.29, "coord_origin": "TOPLEFT" }, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 301.15, "r_x1": 286.37, "r_y1": 301.15, "r_x2": 286.37, "r_y2": 292.24, "r_x3": 50.11, "r_y3": 292.24, "coord_origin": "TOPLEFT" }, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 313.11, "r_x1": 75.7, "r_y1": 313.11, "r_x2": 75.7, "r_y2": 304.2, "r_x3": 50.11, "r_y3": 304.2, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 318.0, "r": 286.37, "b": 434.5, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 326.9, "r_x1": 286.36, "r_y1": 326.9, "r_x2": 286.36, "r_y2": 318.0, "r_x3": 62.07, "r_y3": 318.0, "coord_origin": "TOPLEFT" }, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 338.86, "r_x1": 286.37, "r_y1": 338.86, "r_x2": 286.37, "r_y2": 329.95, "r_x3": 50.11, "r_y3": 329.95, "coord_origin": "TOPLEFT" }, "text": "all datasets are skewed towards simpler structures with", "orig": "all datasets are skewed towards simpler structures with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 350.81, "r_x1": 286.37, "r_y1": 350.81, "r_x2": 286.37, "r_y2": 341.91, "r_x3": 50.11, "r_y3": 341.91, "coord_origin": "TOPLEFT" }, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 362.77, "r_x1": 286.37, "r_y1": 362.77, "r_x2": 286.37, "r_y2": 353.86, "r_x3": 50.11, "r_y3": 353.86, "coord_origin": "TOPLEFT" }, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 374.72, "r_x1": 286.37, "r_y1": 374.72, "r_x2": 286.37, "r_y2": 365.82, "r_x3": 50.11, "r_y3": 365.82, "coord_origin": "TOPLEFT" }, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 386.68, "r_x1": 141.59, "r_y1": 386.68, "r_x2": 141.59, "r_y2": 377.77, "r_x3": 50.11, "r_y3": 377.77, "coord_origin": "TOPLEFT" }, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.7, "r_y0": 386.68, "r_x1": 286.37, "r_y1": 386.68, "r_x2": 286.37, "r_y2": 377.77, "r_x3": 148.7, "r_y3": 377.77, "coord_origin": "TOPLEFT" }, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 398.63, "r_x1": 286.37, "r_y1": 398.63, "r_x2": 286.37, "r_y2": 389.73, "r_x3": 50.11, "r_y3": 389.73, "coord_origin": "TOPLEFT" }, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 410.59, "r_x1": 286.37, "r_y1": 410.59, "r_x2": 286.37, "r_y2": 401.68, "r_x3": 50.11, "r_y3": 401.68, "coord_origin": "TOPLEFT" }, "text": "Net) is restricted to a certain domain. Ultimately, the lack", "orig": "Net) is restricted to a certain domain. Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 422.54, "r_x1": 286.37, "r_y1": 422.54, "r_x2": 286.37, "r_y2": 413.64, "r_x3": 50.11, "r_y3": 413.64, "coord_origin": "TOPLEFT" }, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 434.5, "r_x1": 216.4, "r_y1": 434.5, "r_x2": 216.4, "r_y2": 425.59, "r_x3": 50.11, "r_y3": 425.59, "coord_origin": "TOPLEFT" }, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data." }, { "label": "text", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 439.39, "r": 286.37, "b": 627.62, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 448.3, "r_x1": 286.36, "r_y1": 448.3, "r_x2": 286.36, "r_y2": 439.39, "r_x3": 62.07, "r_y3": 439.39, "coord_origin": "TOPLEFT" }, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 460.25, "r_x1": 172.14, "r_y1": 460.25, "r_x2": 172.14, "r_y2": 451.34, "r_x3": 50.11, "r_y3": 451.34, "coord_origin": "TOPLEFT" }, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.15, "r_y0": 460.02, "r_x1": 224.71, "r_y1": 460.02, "r_x2": 224.71, "r_y2": 451.43, "r_x3": 174.15, "r_y3": 451.43, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.71, "r_y0": 460.25, "r_x1": 286.37, "r_y1": 460.25, "r_x2": 286.37, "r_y2": 451.34, "r_x3": 224.71, "r_y3": 451.34, "coord_origin": "TOPLEFT" }, "text": ". This approach", "orig": ". This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 472.21, "r_x1": 286.37, "r_y1": 472.21, "r_x2": 286.37, "r_y2": 463.3, "r_x3": 50.11, "r_y3": 463.3, "coord_origin": "TOPLEFT" }, "text": "offers control over: 1) the size of the dataset, 2) the table", "orig": "offers control over: 1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 484.16, "r_x1": 286.37, "r_y1": 484.16, "r_x2": 286.37, "r_y2": 475.26, "r_x3": 50.11, "r_y3": 475.26, "coord_origin": "TOPLEFT" }, "text": "structure, 3) the table style and 4) the type of content. The", "orig": "structure, 3) the table style and 4) the type of content. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 496.12, "r_x1": 286.37, "r_y1": 496.12, "r_x2": 286.37, "r_y2": 487.21, "r_x3": 50.11, "r_y3": 487.21, "coord_origin": "TOPLEFT" }, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 508.07, "r_x1": 286.37, "r_y1": 508.07, "r_x2": 286.37, "r_y2": 499.17, "r_x3": 50.11, "r_y3": 499.17, "coord_origin": "TOPLEFT" }, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 520.03, "r_x1": 286.37, "r_y1": 520.03, "r_x2": 286.37, "r_y2": 511.12, "r_x3": 50.11, "r_y3": 511.12, "coord_origin": "TOPLEFT" }, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 531.98, "r_x1": 286.37, "r_y1": 531.98, "r_x2": 286.37, "r_y2": 523.08, "r_x3": 50.11, "r_y3": 523.08, "coord_origin": "TOPLEFT" }, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 543.94, "r_x1": 286.37, "r_y1": 543.94, "r_x2": 286.37, "r_y2": 535.03, "r_x3": 50.11, "r_y3": 535.03, "coord_origin": "TOPLEFT" }, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 555.89, "r_x1": 286.37, "r_y1": 555.89, "r_x2": 286.37, "r_y2": 546.99, "r_x3": 50.11, "r_y3": 546.99, "coord_origin": "TOPLEFT" }, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 567.85, "r_x1": 286.37, "r_y1": 567.85, "r_x2": 286.37, "r_y2": 558.94, "r_x3": 50.11, "r_y3": 558.94, "coord_origin": "TOPLEFT" }, "text": "corpora. By controlling the size and scope of the synthetic", "orig": "corpora. By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 579.8, "r_x1": 286.37, "r_y1": 579.8, "r_x2": 286.37, "r_y2": 570.9, "r_x3": 50.11, "r_y3": 570.9, "coord_origin": "TOPLEFT" }, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 591.76, "r_x1": 286.37, "r_y1": 591.76, "r_x2": 286.37, "r_y2": 582.85, "r_x3": 50.11, "r_y3": 582.85, "coord_origin": "TOPLEFT" }, "text": "variety of different conditions. For example, we can first", "orig": "variety of different conditions. For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 603.71, "r_x1": 286.37, "r_y1": 603.71, "r_x2": 286.37, "r_y2": 594.81, "r_x3": 50.11, "r_y3": 594.81, "coord_origin": "TOPLEFT" }, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 615.67, "r_x1": 286.37, "r_y1": 615.67, "r_x2": 286.37, "r_y2": 606.76, "r_x3": 50.11, "r_y3": 606.76, "coord_origin": "TOPLEFT" }, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 627.62, "r_x1": 209.75, "r_y1": 627.62, "r_x2": 209.75, "r_y2": 618.72, "r_x3": 50.11, "r_y3": 618.72, "coord_origin": "TOPLEFT" }, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain." }, { "label": "text", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 632.51, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 641.42, "r_x1": 286.36, "r_y1": 641.42, "r_x2": 286.36, "r_y2": 632.51, "r_x3": 62.07, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.43, "r_x3": 50.11, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "generated text. The first two synthetic datasets have been", "orig": "generated text. The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third" }, { "label": "table", "id": 8, "page_no": 3, "cluster": { "id": 8, "label": "table", "bbox": { "l": 310.68, "t": 73.19, "r": 542.95, "b": 155.22, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 17, "label": "text", "bbox": { "l": 412.33, "t": 73.61, "r": 430.9, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 442.86, "t": 73.61, "r": 464.45, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 477.79, "t": 73.61, "r": 494.94, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 508.28, "t": 73.61, "r": 536.91, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 317.06, "t": 85.97, "r": 361.64, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 417.86, "t": 85.67, "r": 425.38, "b": 94.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 449.9, "t": 85.67, "r": 457.42, "b": 94.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 476.4, "t": 85.97, "r": 496.33, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 512.63, "t": 85.97, "r": 532.56, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 317.06, "t": 97.92, "r": 359.43, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 417.86, "t": 97.62, "r": 425.38, "b": 106.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 449.9, "t": 97.62, "r": 457.42, "b": 106.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 476.4, "t": 97.92, "r": 496.33, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 513.46, "t": 97.92, "r": 531.73, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 317.06, "t": 109.88, "r": 359.98, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 417.86, "t": 109.58, "r": 425.38, "b": 118.79, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 450.81, "t": 109.58, "r": 456.5, "b": 118.79, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 476.4, "t": 109.88, "r": 496.33, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 511.25, "t": 109.88, "r": 533.95, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 317.06, "t": 121.83, "r": 400.38, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 417.86, "t": 121.53, "r": 425.38, "b": 130.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 449.9, "t": 121.53, "r": 457.42, "b": 130.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 476.4, "t": 121.83, "r": 496.33, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 512.63, "t": 121.83, "r": 532.56, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 317.06, "t": 133.79, "r": 375.17, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 417.86, "t": 133.49, "r": 425.38, "b": 142.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 449.9, "t": 133.49, "r": 457.42, "b": 142.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 476.4, "t": 133.79, "r": 496.33, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 512.63, "t": 133.79, "r": 532.56, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 317.06, "t": 145.74, "r": 369.39, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 417.86, "t": 145.44, "r": 425.38, "b": 154.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 449.9, "t": 145.44, "r": 457.42, "b": 154.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 476.4, "t": 145.74, "r": 496.33, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 512.63, "t": 145.74, "r": 532.56, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 412.33, "t": 73.61, "r": 430.9, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 442.86, "t": 73.61, "r": 464.45, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 477.79, "t": 73.61, "r": 494.94, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 508.28, "t": 73.61, "r": 536.91, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 85.97, "r": 361.64, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 85.67, "r": 425.38, "b": 94.88, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 85.67, "r": 457.42, "b": 94.88, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 85.97, "r": 496.33, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 85.97, "r": 532.56, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 97.92, "r": 359.43, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 97.62, "r": 425.38, "b": 106.84, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 97.62, "r": 457.42, "b": 106.84, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 97.92, "r": 496.33, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.46, "t": 97.92, "r": 531.73, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 109.88, "r": 359.98, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 109.58, "r": 425.38, "b": 118.79, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 450.81, "t": 109.58, "r": 456.5, "b": 118.79, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 109.88, "r": 496.33, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 511.25, "t": 109.88, "r": 533.95, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 121.83, "r": 400.38, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 121.53, "r": 425.38, "b": 130.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 121.53, "r": 457.42, "b": 130.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 121.83, "r": 496.33, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 121.83, "r": 532.56, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 133.79, "r": 375.17, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 133.49, "r": 425.38, "b": 142.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 133.49, "r": 457.42, "b": 142.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 133.79, "r": 496.33, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 133.79, "r": 532.56, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 145.74, "r": 369.39, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 145.44, "r": 425.38, "b": 154.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 145.44, "r": 457.42, "b": 154.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 145.74, "r": 496.33, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 145.74, "r": 532.56, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 9, "page_no": 3, "cluster": { "id": 9, "label": "caption", "bbox": { "l": 308.86, "t": 167.66, "r": 545.12, "b": 224.39, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 176.57, "r_x1": 344.62, "r_y1": 176.57, "r_x2": 344.62, "r_y2": 167.66, "r_x3": 308.86, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "Table 1:", "orig": "Table 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.08, "r_y0": 176.57, "r_x1": 380.45, "r_y1": 176.57, "r_x2": 380.45, "r_y2": 167.66, "r_x3": 361.08, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.57, "r_y0": 176.34, "r_x1": 468.68, "r_y1": 176.34, "r_x2": 468.68, "r_y2": 167.75, "r_x3": 386.57, "r_y3": 167.75, "coord_origin": "TOPLEFT" }, "text": "\u201cCombined-Tabnet\u201d", "orig": "\u201cCombined-Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.8, "r_y0": 176.57, "r_x1": 489.18, "r_y1": 176.57, "r_x2": 489.18, "r_y2": 167.66, "r_x3": 474.8, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.3, "r_y0": 176.34, "r_x1": 545.11, "r_y1": 176.34, "r_x2": 545.11, "r_y2": 167.75, "r_x3": 495.3, "r_y3": 167.75, "coord_origin": "TOPLEFT" }, "text": "\u201dCombined-", "orig": "\u201dCombined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 188.29, "r_x1": 341.16, "r_y1": 188.29, "r_x2": 341.16, "r_y2": 179.71, "r_x3": 308.86, "r_y3": 179.71, "coord_origin": "TOPLEFT" }, "text": "Tabnet\u201d", "orig": "Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.46, "r_y0": 188.52, "r_x1": 545.11, "r_y1": 188.52, "r_x2": 545.11, "r_y2": 179.62, "r_x3": 343.46, "r_y3": 179.62, "coord_origin": "TOPLEFT" }, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 200.48, "r_x1": 545.12, "r_y1": 200.48, "r_x2": 545.12, "r_y2": 191.57, "r_x3": 308.86, "r_y3": 191.57, "coord_origin": "TOPLEFT" }, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 212.43, "r_x1": 545.11, "r_y1": 212.43, "r_x2": 545.11, "r_y2": 203.53, "r_x3": 308.86, "r_y3": 203.53, "coord_origin": "TOPLEFT" }, "text": "and Fintabnet. (**) The combined dataset is the processed", "orig": "and Fintabnet. (**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 224.39, "r_x1": 523.93, "r_y1": 224.39, "r_x2": 523.93, "r_y2": 215.48, "r_x3": 308.86, "r_y3": 215.48, "coord_origin": "TOPLEFT" }, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1: Both \"Combined-Tabnet\" and \"CombinedTabnet\" are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank." }, { "label": "text", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "text", "bbox": { "l": 308.86, "t": 249.62, "r": 545.12, "b": 294.39, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.53, "r_x1": 545.12, "r_y1": 258.53, "r_x2": 545.12, "r_y2": 249.62, "r_x3": 308.86, "r_y3": 249.62, "coord_origin": "TOPLEFT" }, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.48, "r_x1": 545.12, "r_y1": 270.48, "r_x2": 545.12, "r_y2": 261.58, "r_x3": 308.86, "r_y3": 261.58, "coord_origin": "TOPLEFT" }, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.44, "r_x1": 545.12, "r_y1": 282.44, "r_x2": 545.12, "r_y2": 273.53, "r_x3": 308.86, "r_y3": 273.53, "coord_origin": "TOPLEFT" }, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.39, "r_x1": 436.82, "r_y1": 294.39, "r_x2": 436.82, "r_y2": 285.49, "r_x3": 308.86, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples." }, { "label": "text", "id": 13, "page_no": 3, "cluster": { "id": 13, "label": "text", "bbox": { "l": 320.82, "t": 297.77, "r": 542.74, "b": 306.68, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 306.68, "r_x1": 542.74, "r_y1": 306.68, "r_x2": 542.74, "r_y2": 297.77, "r_x3": 320.82, "r_y3": 297.77, "coord_origin": "TOPLEFT" }, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tab. 1 summarizes the various attributes of the datasets." }, { "label": "section_header", "id": 11, "page_no": 3, "cluster": { "id": 11, "label": "section_header", "bbox": { "l": 308.86, "t": 321.18, "r": 444.94, "b": 331.93, "coord_origin": "TOPLEFT" }, "confidence": 0.947, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 331.93, "r_x1": 316.28, "r_y1": 331.93, "r_x2": 316.28, "r_y2": 321.18, "r_x3": 308.86, "r_y3": 321.18, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.18, "r_y0": 331.93, "r_x1": 444.94, "r_y1": 331.93, "r_x2": 444.94, "r_y2": 321.18, "r_x3": 326.18, "r_y3": 321.18, "coord_origin": "TOPLEFT" }, "text": "The TableFormer model", "orig": "The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. The TableFormer model" }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 341.94, "r": 545.12, "b": 446.49, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 350.85, "r_x1": 545.11, "r_y1": 350.85, "r_x2": 545.11, "r_y2": 341.94, "r_x3": 320.82, "r_y3": 341.94, "coord_origin": "TOPLEFT" }, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 362.8, "r_x1": 545.12, "r_y1": 362.8, "r_x2": 545.12, "r_y2": 353.89, "r_x3": 308.86, "r_y3": 353.89, "coord_origin": "TOPLEFT" }, "text": "dict: 1) a sequence of tokens that represent the structure of", "orig": "dict: 1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 374.76, "r_x1": 545.12, "r_y1": 374.76, "r_x2": 545.12, "r_y2": 365.85, "r_x3": 308.86, "r_y3": 365.85, "coord_origin": "TOPLEFT" }, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 386.71, "r_x1": 545.12, "r_y1": 386.71, "r_x2": 545.12, "r_y2": 377.8, "r_x3": 308.86, "r_y3": 377.8, "coord_origin": "TOPLEFT" }, "text": "tokens. The conversion of an image into a sequence of to-", "orig": "tokens. The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 398.67, "r_x1": 545.12, "r_y1": 398.67, "r_x2": 545.12, "r_y2": 389.76, "r_x3": 308.86, "r_y3": 389.76, "coord_origin": "TOPLEFT" }, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 410.62, "r_x1": 545.12, "r_y1": 410.62, "r_x2": 545.12, "r_y2": 401.71, "r_x3": 308.86, "r_y3": 401.71, "coord_origin": "TOPLEFT" }, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 422.58, "r_x1": 545.12, "r_y1": 422.58, "r_x2": 545.12, "r_y2": 413.67, "r_x3": 308.86, "r_y3": 413.67, "coord_origin": "TOPLEFT" }, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 434.53, "r_x1": 545.12, "r_y1": 434.53, "r_x2": 545.12, "r_y2": 425.63, "r_x3": 308.86, "r_y3": 425.63, "coord_origin": "TOPLEFT" }, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 446.49, "r_x1": 437.94, "r_y1": 446.49, "r_x2": 437.94, "r_y2": 437.58, "r_x3": 308.86, "r_y3": 437.58, "coord_origin": "TOPLEFT" }, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required." }, { "label": "section_header", "id": 12, "page_no": 3, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 308.86, "t": 457.69, "r": 420.16, "b": 467.55, "coord_origin": "TOPLEFT" }, "confidence": 0.938, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 467.55, "r_x1": 323.14, "r_y1": 467.55, "r_x2": 323.14, "r_y2": 457.69, "r_x3": 308.86, "r_y3": 457.69, "coord_origin": "TOPLEFT" }, "text": "4.1.", "orig": "4.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.66, "r_y0": 467.55, "r_x1": 420.16, "r_y1": 467.55, "r_x2": 420.16, "r_y2": 457.69, "r_x3": 332.66, "r_y3": 457.69, "coord_origin": "TOPLEFT" }, "text": "Model architecture.", "orig": "Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1. Model architecture." }, { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 476.77, "r": 545.12, "b": 665.0, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 485.67, "r_x1": 545.11, "r_y1": 485.67, "r_x2": 545.11, "r_y2": 476.77, "r_x3": 320.82, "r_y3": 476.77, "coord_origin": "TOPLEFT" }, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.63, "r_x1": 509.02, "r_y1": 497.63, "r_x2": 509.02, "r_y2": 488.72, "r_x3": 308.86, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "is composed of three main components, see Fig.", "orig": "is composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.59, "r_y0": 497.63, "r_x1": 523.06, "r_y1": 497.63, "r_x2": 523.06, "r_y2": 488.72, "r_x3": 515.59, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 497.63, "r_x1": 545.12, "r_y1": 497.63, "r_x2": 545.12, "r_y2": 488.72, "r_x3": 529.62, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.35, "r_x1": 406.35, "r_y1": 509.35, "r_x2": 406.35, "r_y2": 500.76, "r_x3": 308.86, "r_y3": 500.76, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.87, "r_y0": 509.58, "r_x1": 545.11, "r_y1": 509.58, "r_x2": 545.11, "r_y2": 500.68, "r_x3": 408.87, "r_y3": 500.68, "coord_origin": "TOPLEFT" }, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.54, "r_x1": 409.39, "r_y1": 521.54, "r_x2": 409.39, "r_y2": 512.63, "r_x3": 308.86, "r_y3": 512.63, "coord_origin": "TOPLEFT" }, "text": "tor of predefined length.", "orig": "tor of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 416.73, "r_y0": 521.54, "r_x1": 545.12, "r_y1": 521.54, "r_x2": 545.12, "r_y2": 512.63, "r_x3": 416.73, "r_y3": 512.63, "coord_origin": "TOPLEFT" }, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.49, "r_x1": 436.19, "r_y1": 533.49, "r_x2": 436.19, "r_y2": 524.59, "r_x3": 308.86, "r_y3": 524.59, "coord_origin": "TOPLEFT" }, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 533.26, "r_x1": 513.87, "r_y1": 533.26, "r_x2": 513.87, "r_y2": 524.68, "r_x3": 439.53, "r_y3": 524.68, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 517.43, "r_y0": 533.49, "r_x1": 545.11, "r_y1": 533.49, "r_x2": 545.11, "r_y2": 524.59, "r_x3": 517.43, "r_y3": 524.59, "coord_origin": "TOPLEFT" }, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.45, "r_x1": 545.12, "r_y1": 545.45, "r_x2": 545.12, "r_y2": 536.54, "r_x3": 308.86, "r_y3": 536.54, "coord_origin": "TOPLEFT" }, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.4, "r_x1": 358.55, "r_y1": 557.4, "r_x2": 358.55, "r_y2": 548.5, "r_x3": 308.86, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.19, "r_y0": 557.4, "r_x1": 545.12, "r_y1": 557.4, "r_x2": 545.12, "r_y2": 548.5, "r_x3": 365.19, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.36, "r_x1": 352.41, "r_y1": 569.36, "r_x2": 352.41, "r_y2": 560.45, "r_x3": 308.86, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "data cell (\u2018", "orig": "data cell (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.41, "r_y0": 569.14, "r_x1": 360.16, "r_y1": 569.14, "r_x2": 360.16, "r_y2": 560.29, "r_x3": 352.41, "r_y3": 560.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.16, "r_y0": 569.36, "r_x1": 367.91, "r_y1": 569.36, "r_x2": 367.91, "r_y2": 560.45, "r_x3": 360.16, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.91, "r_y0": 569.14, "r_x1": 375.66, "r_y1": 569.14, "r_x2": 375.66, "r_y2": 560.29, "r_x3": 367.91, "r_y3": 560.29, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.66, "r_y0": 569.36, "r_x1": 545.11, "r_y1": 569.36, "r_x2": 545.11, "r_y2": 560.45, "r_x3": 375.66, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "\u2019) the hidden state of that cell is passed to", "orig": "\u2019) the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.31, "r_x1": 545.11, "r_y1": 581.31, "r_x2": 545.11, "r_y2": 572.41, "r_x3": 308.86, "r_y3": 572.41, "coord_origin": "TOPLEFT" }, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.27, "r_x1": 483.12, "r_y1": 593.27, "r_x2": 483.12, "r_y2": 584.36, "r_x3": 308.86, "r_y3": 584.36, "coord_origin": "TOPLEFT" }, "text": "or column span, the tag is broken down to \u2018", "orig": "or column span, the tag is broken down to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.12, "r_y0": 593.05, "r_x1": 490.87, "r_y1": 593.05, "r_x2": 490.87, "r_y2": 584.2, "r_x3": 483.12, "r_y3": 584.2, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.87, "r_y0": 593.27, "r_x1": 545.11, "r_y1": 593.27, "r_x2": 545.11, "r_y2": 584.36, "r_x3": 490.87, "r_y3": 584.36, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018rowspan=\u2019", "orig": "\u2019, \u2018rowspan=\u2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.22, "r_x1": 545.11, "r_y1": 605.22, "r_x2": 545.11, "r_y2": 596.32, "r_x3": 308.86, "r_y3": 596.32, "coord_origin": "TOPLEFT" }, "text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.18, "r_x1": 329.64, "r_y1": 617.18, "r_x2": 329.64, "r_y2": 608.27, "r_x3": 308.86, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "and \u2018", "orig": "and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.65, "r_y0": 616.96, "r_x1": 337.39, "r_y1": 616.96, "r_x2": 337.39, "r_y2": 608.11, "r_x3": 329.65, "r_y3": 608.11, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.39, "r_y0": 617.18, "r_x1": 468.59, "r_y1": 617.18, "r_x2": 468.59, "r_y2": 608.27, "r_x3": 337.39, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "\u2019. The hidden state attached to \u2018", "orig": "\u2019. The hidden state attached to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.59, "r_y0": 616.96, "r_x1": 476.34, "r_y1": 616.96, "r_x2": 476.34, "r_y2": 608.11, "r_x3": 468.59, "r_y3": 608.11, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.34, "r_y0": 617.18, "r_x1": 545.12, "r_y1": 617.18, "r_x2": 545.12, "r_y2": 608.27, "r_x3": 476.34, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "\u2019 is passed to the", "orig": "\u2019 is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.13, "r_x1": 545.11, "r_y1": 629.13, "r_x2": 545.11, "r_y2": 620.23, "r_x3": 308.86, "r_y3": 620.23, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.09, "r_x1": 545.12, "r_y1": 641.09, "r_x2": 545.12, "r_y2": 632.18, "r_x3": 308.86, "r_y3": 632.18, "coord_origin": "TOPLEFT" }, "text": "receives the hidden states from the Structure Decoder, to", "orig": "receives the hidden states from the Structure Decoder, to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.04, "r_x1": 545.12, "r_y1": 653.04, "r_x2": 545.12, "r_y2": 644.14, "r_x3": 308.86, "r_y3": 644.14, "coord_origin": "TOPLEFT" }, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.0, "r_x1": 449.42, "r_y1": 665.0, "r_x2": 449.42, "r_y2": 656.09, "r_x3": 308.86, "r_y3": 656.09, "coord_origin": "TOPLEFT" }, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification." }, { "label": "text", "id": 7, "page_no": 3, "cluster": { "id": 7, "label": "text", "bbox": { "l": 308.86, "t": 668.26, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 677.22, "r_x1": 431.91, "r_y1": 677.22, "r_x2": 431.91, "r_y2": 668.26, "r_x3": 320.82, "r_y3": 668.26, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 439.5, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.11, "r_y1": 689.24, "r_x2": 545.11, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-" }, { "label": "page_footer", "id": 14, "page_no": 3, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" } ], "body": [ { "label": "text", "id": 10, "page_no": 3, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 96.07, "coord_origin": "TOPLEFT" }, "confidence": 0.961, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 212.28, "r_y1": 96.07, "r_x2": 212.28, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)." }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 100.96, "r": 286.37, "b": 313.11, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 109.87, "r_x1": 286.37, "r_y1": 109.87, "r_x2": 286.37, "r_y2": 100.96, "r_x3": 62.07, "r_y3": 100.96, "coord_origin": "TOPLEFT" }, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 121.82, "r_x1": 286.37, "r_y1": 121.82, "r_x2": 286.37, "r_y2": 112.92, "r_x3": 50.11, "r_y3": 112.92, "coord_origin": "TOPLEFT" }, "text": "is essential to train our models. In order to distinguish be-", "orig": "is essential to train our models. In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 133.78, "r_x1": 286.37, "r_y1": 133.78, "r_x2": 286.37, "r_y2": 124.87, "r_x3": 50.11, "r_y3": 124.87, "coord_origin": "TOPLEFT" }, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 145.73, "r_x1": 286.37, "r_y1": 145.73, "r_x2": 286.37, "r_y2": 136.83, "r_x3": 50.11, "r_y3": 136.83, "coord_origin": "TOPLEFT" }, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 157.69, "r_x1": 286.37, "r_y1": 157.69, "r_x2": 286.37, "r_y2": 148.78, "r_x3": 50.11, "r_y3": 148.78, "coord_origin": "TOPLEFT" }, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 169.64, "r_x1": 286.37, "r_y1": 169.64, "r_x2": 286.37, "r_y2": 160.74, "r_x3": 50.11, "r_y3": 160.74, "coord_origin": "TOPLEFT" }, "text": "tables (e.g. TableBank) or they narrow their scope only to", "orig": "tables (e.g. TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 181.6, "r_x1": 286.37, "r_y1": 181.6, "r_x2": 286.37, "r_y2": 172.69, "r_x3": 50.11, "r_y3": 172.69, "coord_origin": "TOPLEFT" }, "text": "non-empty cells. Therefore, it was imperative to introduce", "orig": "non-empty cells. Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 193.55, "r_x1": 286.37, "r_y1": 193.55, "r_x2": 286.37, "r_y2": 184.65, "r_x3": 50.11, "r_y3": 184.65, "coord_origin": "TOPLEFT" }, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 205.51, "r_x1": 286.37, "r_y1": 205.51, "r_x2": 286.37, "r_y2": 196.6, "r_x3": 50.11, "r_y3": 196.6, "coord_origin": "TOPLEFT" }, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 217.46, "r_x1": 286.37, "r_y1": 217.46, "r_x2": 286.37, "r_y2": 208.56, "r_x3": 50.11, "r_y3": 208.56, "coord_origin": "TOPLEFT" }, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 229.42, "r_x1": 286.37, "r_y1": 229.42, "r_x2": 286.37, "r_y2": 220.51, "r_x3": 50.11, "r_y3": 220.51, "coord_origin": "TOPLEFT" }, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 241.37, "r_x1": 286.37, "r_y1": 241.37, "r_x2": 286.37, "r_y2": 232.47, "r_x3": 50.11, "r_y3": 232.47, "coord_origin": "TOPLEFT" }, "text": "ers the table structure. Notice that each table cell may oc-", "orig": "ers the table structure. Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 253.33, "r_x1": 286.37, "r_y1": 253.33, "r_x2": 286.37, "r_y2": 244.42, "r_x3": 50.11, "r_y3": 244.42, "coord_origin": "TOPLEFT" }, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 265.28, "r_x1": 286.37, "r_y1": 265.28, "r_x2": 286.37, "r_y2": 256.38, "r_x3": 50.11, "r_y3": 256.38, "coord_origin": "TOPLEFT" }, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 277.24, "r_x1": 286.37, "r_y1": 277.24, "r_x2": 286.37, "r_y2": 268.33, "r_x3": 50.11, "r_y3": 268.33, "coord_origin": "TOPLEFT" }, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 289.2, "r_x1": 68.65, "r_y1": 289.2, "r_x2": 68.65, "r_y2": 280.29, "r_x3": 50.11, "r_y3": 280.29, "coord_origin": "TOPLEFT" }, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 75.57, "r_y0": 289.2, "r_x1": 286.37, "r_y1": 289.2, "r_x2": 286.37, "r_y2": 280.29, "r_x3": 75.57, "r_y3": 280.29, "coord_origin": "TOPLEFT" }, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 301.15, "r_x1": 286.37, "r_y1": 301.15, "r_x2": 286.37, "r_y2": 292.24, "r_x3": 50.11, "r_y3": 292.24, "coord_origin": "TOPLEFT" }, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 313.11, "r_x1": 75.7, "r_y1": 313.11, "r_x2": 75.7, "r_y2": 304.2, "r_x3": 50.11, "r_y3": 304.2, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 318.0, "r": 286.37, "b": 434.5, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 326.9, "r_x1": 286.36, "r_y1": 326.9, "r_x2": 286.36, "r_y2": 318.0, "r_x3": 62.07, "r_y3": 318.0, "coord_origin": "TOPLEFT" }, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 338.86, "r_x1": 286.37, "r_y1": 338.86, "r_x2": 286.37, "r_y2": 329.95, "r_x3": 50.11, "r_y3": 329.95, "coord_origin": "TOPLEFT" }, "text": "all datasets are skewed towards simpler structures with", "orig": "all datasets are skewed towards simpler structures with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 350.81, "r_x1": 286.37, "r_y1": 350.81, "r_x2": 286.37, "r_y2": 341.91, "r_x3": 50.11, "r_y3": 341.91, "coord_origin": "TOPLEFT" }, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 362.77, "r_x1": 286.37, "r_y1": 362.77, "r_x2": 286.37, "r_y2": 353.86, "r_x3": 50.11, "r_y3": 353.86, "coord_origin": "TOPLEFT" }, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 374.72, "r_x1": 286.37, "r_y1": 374.72, "r_x2": 286.37, "r_y2": 365.82, "r_x3": 50.11, "r_y3": 365.82, "coord_origin": "TOPLEFT" }, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 386.68, "r_x1": 141.59, "r_y1": 386.68, "r_x2": 141.59, "r_y2": 377.77, "r_x3": 50.11, "r_y3": 377.77, "coord_origin": "TOPLEFT" }, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.7, "r_y0": 386.68, "r_x1": 286.37, "r_y1": 386.68, "r_x2": 286.37, "r_y2": 377.77, "r_x3": 148.7, "r_y3": 377.77, "coord_origin": "TOPLEFT" }, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 398.63, "r_x1": 286.37, "r_y1": 398.63, "r_x2": 286.37, "r_y2": 389.73, "r_x3": 50.11, "r_y3": 389.73, "coord_origin": "TOPLEFT" }, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 410.59, "r_x1": 286.37, "r_y1": 410.59, "r_x2": 286.37, "r_y2": 401.68, "r_x3": 50.11, "r_y3": 401.68, "coord_origin": "TOPLEFT" }, "text": "Net) is restricted to a certain domain. Ultimately, the lack", "orig": "Net) is restricted to a certain domain. Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 422.54, "r_x1": 286.37, "r_y1": 422.54, "r_x2": 286.37, "r_y2": 413.64, "r_x3": 50.11, "r_y3": 413.64, "coord_origin": "TOPLEFT" }, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 434.5, "r_x1": 216.4, "r_y1": 434.5, "r_x2": 216.4, "r_y2": 425.59, "r_x3": 50.11, "r_y3": 425.59, "coord_origin": "TOPLEFT" }, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data." }, { "label": "text", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 439.39, "r": 286.37, "b": 627.62, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 448.3, "r_x1": 286.36, "r_y1": 448.3, "r_x2": 286.36, "r_y2": 439.39, "r_x3": 62.07, "r_y3": 439.39, "coord_origin": "TOPLEFT" }, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 460.25, "r_x1": 172.14, "r_y1": 460.25, "r_x2": 172.14, "r_y2": 451.34, "r_x3": 50.11, "r_y3": 451.34, "coord_origin": "TOPLEFT" }, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.15, "r_y0": 460.02, "r_x1": 224.71, "r_y1": 460.02, "r_x2": 224.71, "r_y2": 451.43, "r_x3": 174.15, "r_y3": 451.43, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.71, "r_y0": 460.25, "r_x1": 286.37, "r_y1": 460.25, "r_x2": 286.37, "r_y2": 451.34, "r_x3": 224.71, "r_y3": 451.34, "coord_origin": "TOPLEFT" }, "text": ". This approach", "orig": ". This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 472.21, "r_x1": 286.37, "r_y1": 472.21, "r_x2": 286.37, "r_y2": 463.3, "r_x3": 50.11, "r_y3": 463.3, "coord_origin": "TOPLEFT" }, "text": "offers control over: 1) the size of the dataset, 2) the table", "orig": "offers control over: 1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 484.16, "r_x1": 286.37, "r_y1": 484.16, "r_x2": 286.37, "r_y2": 475.26, "r_x3": 50.11, "r_y3": 475.26, "coord_origin": "TOPLEFT" }, "text": "structure, 3) the table style and 4) the type of content. The", "orig": "structure, 3) the table style and 4) the type of content. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 496.12, "r_x1": 286.37, "r_y1": 496.12, "r_x2": 286.37, "r_y2": 487.21, "r_x3": 50.11, "r_y3": 487.21, "coord_origin": "TOPLEFT" }, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 508.07, "r_x1": 286.37, "r_y1": 508.07, "r_x2": 286.37, "r_y2": 499.17, "r_x3": 50.11, "r_y3": 499.17, "coord_origin": "TOPLEFT" }, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 520.03, "r_x1": 286.37, "r_y1": 520.03, "r_x2": 286.37, "r_y2": 511.12, "r_x3": 50.11, "r_y3": 511.12, "coord_origin": "TOPLEFT" }, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 531.98, "r_x1": 286.37, "r_y1": 531.98, "r_x2": 286.37, "r_y2": 523.08, "r_x3": 50.11, "r_y3": 523.08, "coord_origin": "TOPLEFT" }, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 543.94, "r_x1": 286.37, "r_y1": 543.94, "r_x2": 286.37, "r_y2": 535.03, "r_x3": 50.11, "r_y3": 535.03, "coord_origin": "TOPLEFT" }, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 555.89, "r_x1": 286.37, "r_y1": 555.89, "r_x2": 286.37, "r_y2": 546.99, "r_x3": 50.11, "r_y3": 546.99, "coord_origin": "TOPLEFT" }, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 567.85, "r_x1": 286.37, "r_y1": 567.85, "r_x2": 286.37, "r_y2": 558.94, "r_x3": 50.11, "r_y3": 558.94, "coord_origin": "TOPLEFT" }, "text": "corpora. By controlling the size and scope of the synthetic", "orig": "corpora. By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 579.8, "r_x1": 286.37, "r_y1": 579.8, "r_x2": 286.37, "r_y2": 570.9, "r_x3": 50.11, "r_y3": 570.9, "coord_origin": "TOPLEFT" }, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 591.76, "r_x1": 286.37, "r_y1": 591.76, "r_x2": 286.37, "r_y2": 582.85, "r_x3": 50.11, "r_y3": 582.85, "coord_origin": "TOPLEFT" }, "text": "variety of different conditions. For example, we can first", "orig": "variety of different conditions. For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 603.71, "r_x1": 286.37, "r_y1": 603.71, "r_x2": 286.37, "r_y2": 594.81, "r_x3": 50.11, "r_y3": 594.81, "coord_origin": "TOPLEFT" }, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 615.67, "r_x1": 286.37, "r_y1": 615.67, "r_x2": 286.37, "r_y2": 606.76, "r_x3": 50.11, "r_y3": 606.76, "coord_origin": "TOPLEFT" }, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 627.62, "r_x1": 209.75, "r_y1": 627.62, "r_x2": 209.75, "r_y2": 618.72, "r_x3": 50.11, "r_y3": 618.72, "coord_origin": "TOPLEFT" }, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain." }, { "label": "text", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 632.51, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 641.42, "r_x1": 286.36, "r_y1": 641.42, "r_x2": 286.36, "r_y2": 632.51, "r_x3": 62.07, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.43, "r_x3": 50.11, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "generated text. The first two synthetic datasets have been", "orig": "generated text. The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third" }, { "label": "table", "id": 8, "page_no": 3, "cluster": { "id": 8, "label": "table", "bbox": { "l": 310.68, "t": 73.19, "r": 542.95, "b": 155.22, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 17, "label": "text", "bbox": { "l": 412.33, "t": 73.61, "r": 430.9, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.33, "r_y0": 82.52, "r_x1": 430.9, "r_y1": 82.52, "r_x2": 430.9, "r_y2": 73.61, "r_x3": 412.33, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 442.86, "t": 73.61, "r": 464.45, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.86, "r_y0": 82.52, "r_x1": 464.45, "r_y1": 82.52, "r_x2": 464.45, "r_y2": 73.61, "r_x3": 442.86, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 477.79, "t": 73.61, "r": 494.94, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.79, "r_y0": 82.52, "r_x1": 494.94, "r_y1": 82.52, "r_x2": 494.94, "r_y2": 73.61, "r_x3": 477.79, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 508.28, "t": 73.61, "r": 536.91, "b": 82.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.28, "r_y0": 82.52, "r_x1": 536.91, "r_y1": 82.52, "r_x2": 536.91, "r_y2": 73.61, "r_x3": 508.28, "r_y3": 73.61, "coord_origin": "TOPLEFT" }, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 317.06, "t": 85.97, "r": 361.64, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 94.87, "r_x1": 361.64, "r_y1": 94.87, "r_x2": 361.64, "r_y2": 85.97, "r_x3": 317.06, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 417.86, "t": 85.67, "r": 425.38, "b": 94.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 94.88, "r_x1": 425.38, "r_y1": 94.88, "r_x2": 425.38, "r_y2": 85.67, "r_x3": 417.86, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 449.9, "t": 85.67, "r": 457.42, "b": 94.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 94.88, "r_x1": 457.42, "r_y1": 94.88, "r_x2": 457.42, "r_y2": 85.67, "r_x3": 449.9, "r_y3": 85.67, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 476.4, "t": 85.97, "r": 496.33, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 94.87, "r_x1": 496.33, "r_y1": 94.87, "r_x2": 496.33, "r_y2": 85.97, "r_x3": 476.4, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 512.63, "t": 85.97, "r": 532.56, "b": 94.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 94.87, "r_x1": 532.56, "r_y1": 94.87, "r_x2": 532.56, "r_y2": 85.97, "r_x3": 512.63, "r_y3": 85.97, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 317.06, "t": 97.92, "r": 359.43, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 106.83, "r_x1": 359.43, "r_y1": 106.83, "r_x2": 359.43, "r_y2": 97.92, "r_x3": 317.06, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 417.86, "t": 97.62, "r": 425.38, "b": 106.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 106.84, "r_x1": 425.38, "r_y1": 106.84, "r_x2": 425.38, "r_y2": 97.62, "r_x3": 417.86, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 449.9, "t": 97.62, "r": 457.42, "b": 106.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 106.84, "r_x1": 457.42, "r_y1": 106.84, "r_x2": 457.42, "r_y2": 97.62, "r_x3": 449.9, "r_y3": 97.62, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 476.4, "t": 97.92, "r": 496.33, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 106.83, "r_x1": 496.33, "r_y1": 106.83, "r_x2": 496.33, "r_y2": 97.92, "r_x3": 476.4, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 513.46, "t": 97.92, "r": 531.73, "b": 106.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.46, "r_y0": 106.83, "r_x1": 531.73, "r_y1": 106.83, "r_x2": 531.73, "r_y2": 97.92, "r_x3": 513.46, "r_y3": 97.92, "coord_origin": "TOPLEFT" }, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 317.06, "t": 109.88, "r": 359.98, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 118.78, "r_x1": 359.98, "r_y1": 118.78, "r_x2": 359.98, "r_y2": 109.88, "r_x3": 317.06, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 417.86, "t": 109.58, "r": 425.38, "b": 118.79, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 118.79, "r_x1": 425.38, "r_y1": 118.79, "r_x2": 425.38, "r_y2": 109.58, "r_x3": 417.86, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 450.81, "t": 109.58, "r": 456.5, "b": 118.79, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.81, "r_y0": 118.79, "r_x1": 456.5, "r_y1": 118.79, "r_x2": 456.5, "r_y2": 109.58, "r_x3": 450.81, "r_y3": 109.58, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 476.4, "t": 109.88, "r": 496.33, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 118.78, "r_x1": 496.33, "r_y1": 118.78, "r_x2": 496.33, "r_y2": 109.88, "r_x3": 476.4, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 511.25, "t": 109.88, "r": 533.95, "b": 118.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.25, "r_y0": 118.78, "r_x1": 533.95, "r_y1": 118.78, "r_x2": 533.95, "r_y2": 109.88, "r_x3": 511.25, "r_y3": 109.88, "coord_origin": "TOPLEFT" }, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 317.06, "t": 121.83, "r": 400.38, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 130.74, "r_x1": 400.38, "r_y1": 130.74, "r_x2": 400.38, "r_y2": 121.83, "r_x3": 317.06, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 417.86, "t": 121.53, "r": 425.38, "b": 130.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 130.75, "r_x1": 425.38, "r_y1": 130.75, "r_x2": 425.38, "r_y2": 121.53, "r_x3": 417.86, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 449.9, "t": 121.53, "r": 457.42, "b": 130.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 130.75, "r_x1": 457.42, "r_y1": 130.75, "r_x2": 457.42, "r_y2": 121.53, "r_x3": 449.9, "r_y3": 121.53, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 476.4, "t": 121.83, "r": 496.33, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 130.74, "r_x1": 496.33, "r_y1": 130.74, "r_x2": 496.33, "r_y2": 121.83, "r_x3": 476.4, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 512.63, "t": 121.83, "r": 532.56, "b": 130.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 130.74, "r_x1": 532.56, "r_y1": 130.74, "r_x2": 532.56, "r_y2": 121.83, "r_x3": 512.63, "r_y3": 121.83, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 317.06, "t": 133.79, "r": 375.17, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 142.69, "r_x1": 375.17, "r_y1": 142.69, "r_x2": 375.17, "r_y2": 133.79, "r_x3": 317.06, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 417.86, "t": 133.49, "r": 425.38, "b": 142.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 142.7, "r_x1": 425.38, "r_y1": 142.7, "r_x2": 425.38, "r_y2": 133.49, "r_x3": 417.86, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 449.9, "t": 133.49, "r": 457.42, "b": 142.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 142.7, "r_x1": 457.42, "r_y1": 142.7, "r_x2": 457.42, "r_y2": 133.49, "r_x3": 449.9, "r_y3": 133.49, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 476.4, "t": 133.79, "r": 496.33, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 142.69, "r_x1": 496.33, "r_y1": 142.69, "r_x2": 496.33, "r_y2": 133.79, "r_x3": 476.4, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 512.63, "t": 133.79, "r": 532.56, "b": 142.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 142.69, "r_x1": 532.56, "r_y1": 142.69, "r_x2": 532.56, "r_y2": 133.79, "r_x3": 512.63, "r_y3": 133.79, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 317.06, "t": 145.74, "r": 369.39, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 317.06, "r_y0": 154.65, "r_x1": 369.39, "r_y1": 154.65, "r_x2": 369.39, "r_y2": 145.74, "r_x3": 317.06, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 417.86, "t": 145.44, "r": 425.38, "b": 154.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.86, "r_y0": 154.66, "r_x1": 425.38, "r_y1": 154.66, "r_x2": 425.38, "r_y2": 145.44, "r_x3": 417.86, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 449.9, "t": 145.44, "r": 457.42, "b": 154.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.9, "r_y0": 154.66, "r_x1": 457.42, "r_y1": 154.66, "r_x2": 457.42, "r_y2": 145.44, "r_x3": 449.9, "r_y3": 145.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 476.4, "t": 145.74, "r": 496.33, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.4, "r_y0": 154.65, "r_x1": 496.33, "r_y1": 154.65, "r_x2": 496.33, "r_y2": 145.74, "r_x3": 476.4, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 512.63, "t": 145.74, "r": 532.56, "b": 154.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.63, "r_y0": 154.65, "r_x1": 532.56, "r_y1": 154.65, "r_x2": 532.56, "r_y2": 145.74, "r_x3": 512.63, "r_y3": 145.74, "coord_origin": "TOPLEFT" }, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 412.33, "t": 73.61, "r": 430.9, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 442.86, "t": 73.61, "r": 464.45, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 477.79, "t": 73.61, "r": 494.94, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 508.28, "t": 73.61, "r": 536.91, "b": 82.52, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 85.97, "r": 361.64, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 85.67, "r": 425.38, "b": 94.88, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 85.67, "r": 457.42, "b": 94.88, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 85.97, "r": 496.33, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 85.97, "r": 532.56, "b": 94.87, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 97.92, "r": 359.43, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 97.62, "r": 425.38, "b": 106.84, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 97.62, "r": 457.42, "b": 106.84, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 97.92, "r": 496.33, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.46, "t": 97.92, "r": 531.73, "b": 106.83, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 109.88, "r": 359.98, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 109.58, "r": 425.38, "b": 118.79, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 450.81, "t": 109.58, "r": 456.5, "b": 118.79, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 109.88, "r": 496.33, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 511.25, "t": 109.88, "r": 533.95, "b": 118.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 121.83, "r": 400.38, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 121.53, "r": 425.38, "b": 130.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 121.53, "r": 457.42, "b": 130.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 121.83, "r": 496.33, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 121.83, "r": 532.56, "b": 130.74, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 133.79, "r": 375.17, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 133.49, "r": 425.38, "b": 142.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 133.49, "r": 457.42, "b": 142.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 133.79, "r": 496.33, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 133.79, "r": 532.56, "b": 142.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 317.06, "t": 145.74, "r": 369.39, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 417.86, "t": 145.44, "r": 425.38, "b": 154.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.9, "t": 145.44, "r": 457.42, "b": 154.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 476.4, "t": 145.74, "r": 496.33, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.63, "t": 145.74, "r": 532.56, "b": 154.65, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 9, "page_no": 3, "cluster": { "id": 9, "label": "caption", "bbox": { "l": 308.86, "t": 167.66, "r": 545.12, "b": 224.39, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 176.57, "r_x1": 344.62, "r_y1": 176.57, "r_x2": 344.62, "r_y2": 167.66, "r_x3": 308.86, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "Table 1:", "orig": "Table 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.08, "r_y0": 176.57, "r_x1": 380.45, "r_y1": 176.57, "r_x2": 380.45, "r_y2": 167.66, "r_x3": 361.08, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.57, "r_y0": 176.34, "r_x1": 468.68, "r_y1": 176.34, "r_x2": 468.68, "r_y2": 167.75, "r_x3": 386.57, "r_y3": 167.75, "coord_origin": "TOPLEFT" }, "text": "\u201cCombined-Tabnet\u201d", "orig": "\u201cCombined-Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.8, "r_y0": 176.57, "r_x1": 489.18, "r_y1": 176.57, "r_x2": 489.18, "r_y2": 167.66, "r_x3": 474.8, "r_y3": 167.66, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.3, "r_y0": 176.34, "r_x1": 545.11, "r_y1": 176.34, "r_x2": 545.11, "r_y2": 167.75, "r_x3": 495.3, "r_y3": 167.75, "coord_origin": "TOPLEFT" }, "text": "\u201dCombined-", "orig": "\u201dCombined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 188.29, "r_x1": 341.16, "r_y1": 188.29, "r_x2": 341.16, "r_y2": 179.71, "r_x3": 308.86, "r_y3": 179.71, "coord_origin": "TOPLEFT" }, "text": "Tabnet\u201d", "orig": "Tabnet\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.46, "r_y0": 188.52, "r_x1": 545.11, "r_y1": 188.52, "r_x2": 545.11, "r_y2": 179.62, "r_x3": 343.46, "r_y3": 179.62, "coord_origin": "TOPLEFT" }, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 200.48, "r_x1": 545.12, "r_y1": 200.48, "r_x2": 545.12, "r_y2": 191.57, "r_x3": 308.86, "r_y3": 191.57, "coord_origin": "TOPLEFT" }, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 212.43, "r_x1": 545.11, "r_y1": 212.43, "r_x2": 545.11, "r_y2": 203.53, "r_x3": 308.86, "r_y3": 203.53, "coord_origin": "TOPLEFT" }, "text": "and Fintabnet. (**) The combined dataset is the processed", "orig": "and Fintabnet. (**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 224.39, "r_x1": 523.93, "r_y1": 224.39, "r_x2": 523.93, "r_y2": 215.48, "r_x3": 308.86, "r_y3": 215.48, "coord_origin": "TOPLEFT" }, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1: Both \"Combined-Tabnet\" and \"CombinedTabnet\" are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank." }, { "label": "text", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "text", "bbox": { "l": 308.86, "t": 249.62, "r": 545.12, "b": 294.39, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.53, "r_x1": 545.12, "r_y1": 258.53, "r_x2": 545.12, "r_y2": 249.62, "r_x3": 308.86, "r_y3": 249.62, "coord_origin": "TOPLEFT" }, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.48, "r_x1": 545.12, "r_y1": 270.48, "r_x2": 545.12, "r_y2": 261.58, "r_x3": 308.86, "r_y3": 261.58, "coord_origin": "TOPLEFT" }, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.44, "r_x1": 545.12, "r_y1": 282.44, "r_x2": 545.12, "r_y2": 273.53, "r_x3": 308.86, "r_y3": 273.53, "coord_origin": "TOPLEFT" }, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.39, "r_x1": 436.82, "r_y1": 294.39, "r_x2": 436.82, "r_y2": 285.49, "r_x3": 308.86, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples." }, { "label": "text", "id": 13, "page_no": 3, "cluster": { "id": 13, "label": "text", "bbox": { "l": 320.82, "t": 297.77, "r": 542.74, "b": 306.68, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 306.68, "r_x1": 542.74, "r_y1": 306.68, "r_x2": 542.74, "r_y2": 297.77, "r_x3": 320.82, "r_y3": 297.77, "coord_origin": "TOPLEFT" }, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tab. 1 summarizes the various attributes of the datasets." }, { "label": "section_header", "id": 11, "page_no": 3, "cluster": { "id": 11, "label": "section_header", "bbox": { "l": 308.86, "t": 321.18, "r": 444.94, "b": 331.93, "coord_origin": "TOPLEFT" }, "confidence": 0.947, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 331.93, "r_x1": 316.28, "r_y1": 331.93, "r_x2": 316.28, "r_y2": 321.18, "r_x3": 308.86, "r_y3": 321.18, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.18, "r_y0": 331.93, "r_x1": 444.94, "r_y1": 331.93, "r_x2": 444.94, "r_y2": 321.18, "r_x3": 326.18, "r_y3": 321.18, "coord_origin": "TOPLEFT" }, "text": "The TableFormer model", "orig": "The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. The TableFormer model" }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 341.94, "r": 545.12, "b": 446.49, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 350.85, "r_x1": 545.11, "r_y1": 350.85, "r_x2": 545.11, "r_y2": 341.94, "r_x3": 320.82, "r_y3": 341.94, "coord_origin": "TOPLEFT" }, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 362.8, "r_x1": 545.12, "r_y1": 362.8, "r_x2": 545.12, "r_y2": 353.89, "r_x3": 308.86, "r_y3": 353.89, "coord_origin": "TOPLEFT" }, "text": "dict: 1) a sequence of tokens that represent the structure of", "orig": "dict: 1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 374.76, "r_x1": 545.12, "r_y1": 374.76, "r_x2": 545.12, "r_y2": 365.85, "r_x3": 308.86, "r_y3": 365.85, "coord_origin": "TOPLEFT" }, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 386.71, "r_x1": 545.12, "r_y1": 386.71, "r_x2": 545.12, "r_y2": 377.8, "r_x3": 308.86, "r_y3": 377.8, "coord_origin": "TOPLEFT" }, "text": "tokens. The conversion of an image into a sequence of to-", "orig": "tokens. The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 398.67, "r_x1": 545.12, "r_y1": 398.67, "r_x2": 545.12, "r_y2": 389.76, "r_x3": 308.86, "r_y3": 389.76, "coord_origin": "TOPLEFT" }, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 410.62, "r_x1": 545.12, "r_y1": 410.62, "r_x2": 545.12, "r_y2": 401.71, "r_x3": 308.86, "r_y3": 401.71, "coord_origin": "TOPLEFT" }, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 422.58, "r_x1": 545.12, "r_y1": 422.58, "r_x2": 545.12, "r_y2": 413.67, "r_x3": 308.86, "r_y3": 413.67, "coord_origin": "TOPLEFT" }, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 434.53, "r_x1": 545.12, "r_y1": 434.53, "r_x2": 545.12, "r_y2": 425.63, "r_x3": 308.86, "r_y3": 425.63, "coord_origin": "TOPLEFT" }, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 446.49, "r_x1": 437.94, "r_y1": 446.49, "r_x2": 437.94, "r_y2": 437.58, "r_x3": 308.86, "r_y3": 437.58, "coord_origin": "TOPLEFT" }, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required." }, { "label": "section_header", "id": 12, "page_no": 3, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 308.86, "t": 457.69, "r": 420.16, "b": 467.55, "coord_origin": "TOPLEFT" }, "confidence": 0.938, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 467.55, "r_x1": 323.14, "r_y1": 467.55, "r_x2": 323.14, "r_y2": 457.69, "r_x3": 308.86, "r_y3": 457.69, "coord_origin": "TOPLEFT" }, "text": "4.1.", "orig": "4.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.66, "r_y0": 467.55, "r_x1": 420.16, "r_y1": 467.55, "r_x2": 420.16, "r_y2": 457.69, "r_x3": 332.66, "r_y3": 457.69, "coord_origin": "TOPLEFT" }, "text": "Model architecture.", "orig": "Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1. Model architecture." }, { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 476.77, "r": 545.12, "b": 665.0, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 485.67, "r_x1": 545.11, "r_y1": 485.67, "r_x2": 545.11, "r_y2": 476.77, "r_x3": 320.82, "r_y3": 476.77, "coord_origin": "TOPLEFT" }, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.63, "r_x1": 509.02, "r_y1": 497.63, "r_x2": 509.02, "r_y2": 488.72, "r_x3": 308.86, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "is composed of three main components, see Fig.", "orig": "is composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.59, "r_y0": 497.63, "r_x1": 523.06, "r_y1": 497.63, "r_x2": 523.06, "r_y2": 488.72, "r_x3": 515.59, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 497.63, "r_x1": 545.12, "r_y1": 497.63, "r_x2": 545.12, "r_y2": 488.72, "r_x3": 529.62, "r_y3": 488.72, "coord_origin": "TOPLEFT" }, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.35, "r_x1": 406.35, "r_y1": 509.35, "r_x2": 406.35, "r_y2": 500.76, "r_x3": 308.86, "r_y3": 500.76, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.87, "r_y0": 509.58, "r_x1": 545.11, "r_y1": 509.58, "r_x2": 545.11, "r_y2": 500.68, "r_x3": 408.87, "r_y3": 500.68, "coord_origin": "TOPLEFT" }, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.54, "r_x1": 409.39, "r_y1": 521.54, "r_x2": 409.39, "r_y2": 512.63, "r_x3": 308.86, "r_y3": 512.63, "coord_origin": "TOPLEFT" }, "text": "tor of predefined length.", "orig": "tor of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 416.73, "r_y0": 521.54, "r_x1": 545.12, "r_y1": 521.54, "r_x2": 545.12, "r_y2": 512.63, "r_x3": 416.73, "r_y3": 512.63, "coord_origin": "TOPLEFT" }, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.49, "r_x1": 436.19, "r_y1": 533.49, "r_x2": 436.19, "r_y2": 524.59, "r_x3": 308.86, "r_y3": 524.59, "coord_origin": "TOPLEFT" }, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 533.26, "r_x1": 513.87, "r_y1": 533.26, "r_x2": 513.87, "r_y2": 524.68, "r_x3": 439.53, "r_y3": 524.68, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 517.43, "r_y0": 533.49, "r_x1": 545.11, "r_y1": 533.49, "r_x2": 545.11, "r_y2": 524.59, "r_x3": 517.43, "r_y3": 524.59, "coord_origin": "TOPLEFT" }, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.45, "r_x1": 545.12, "r_y1": 545.45, "r_x2": 545.12, "r_y2": 536.54, "r_x3": 308.86, "r_y3": 536.54, "coord_origin": "TOPLEFT" }, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.4, "r_x1": 358.55, "r_y1": 557.4, "r_x2": 358.55, "r_y2": 548.5, "r_x3": 308.86, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 365.19, "r_y0": 557.4, "r_x1": 545.12, "r_y1": 557.4, "r_x2": 545.12, "r_y2": 548.5, "r_x3": 365.19, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.36, "r_x1": 352.41, "r_y1": 569.36, "r_x2": 352.41, "r_y2": 560.45, "r_x3": 308.86, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "data cell (\u2018", "orig": "data cell (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.41, "r_y0": 569.14, "r_x1": 360.16, "r_y1": 569.14, "r_x2": 360.16, "r_y2": 560.29, "r_x3": 352.41, "r_y3": 560.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.16, "r_y0": 569.36, "r_x1": 367.91, "r_y1": 569.36, "r_x2": 367.91, "r_y2": 560.45, "r_x3": 360.16, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.91, "r_y0": 569.14, "r_x1": 375.66, "r_y1": 569.14, "r_x2": 375.66, "r_y2": 560.29, "r_x3": 367.91, "r_y3": 560.29, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.66, "r_y0": 569.36, "r_x1": 545.11, "r_y1": 569.36, "r_x2": 545.11, "r_y2": 560.45, "r_x3": 375.66, "r_y3": 560.45, "coord_origin": "TOPLEFT" }, "text": "\u2019) the hidden state of that cell is passed to", "orig": "\u2019) the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.31, "r_x1": 545.11, "r_y1": 581.31, "r_x2": 545.11, "r_y2": 572.41, "r_x3": 308.86, "r_y3": 572.41, "coord_origin": "TOPLEFT" }, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.27, "r_x1": 483.12, "r_y1": 593.27, "r_x2": 483.12, "r_y2": 584.36, "r_x3": 308.86, "r_y3": 584.36, "coord_origin": "TOPLEFT" }, "text": "or column span, the tag is broken down to \u2018", "orig": "or column span, the tag is broken down to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.12, "r_y0": 593.05, "r_x1": 490.87, "r_y1": 593.05, "r_x2": 490.87, "r_y2": 584.2, "r_x3": 483.12, "r_y3": 584.2, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.87, "r_y0": 593.27, "r_x1": 545.11, "r_y1": 593.27, "r_x2": 545.11, "r_y2": 584.36, "r_x3": 490.87, "r_y3": 584.36, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018rowspan=\u2019", "orig": "\u2019, \u2018rowspan=\u2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.22, "r_x1": 545.11, "r_y1": 605.22, "r_x2": 545.11, "r_y2": 596.32, "r_x3": 308.86, "r_y3": 596.32, "coord_origin": "TOPLEFT" }, "text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.18, "r_x1": 329.64, "r_y1": 617.18, "r_x2": 329.64, "r_y2": 608.27, "r_x3": 308.86, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "and \u2018", "orig": "and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.65, "r_y0": 616.96, "r_x1": 337.39, "r_y1": 616.96, "r_x2": 337.39, "r_y2": 608.11, "r_x3": 329.65, "r_y3": 608.11, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.39, "r_y0": 617.18, "r_x1": 468.59, "r_y1": 617.18, "r_x2": 468.59, "r_y2": 608.27, "r_x3": 337.39, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "\u2019. The hidden state attached to \u2018", "orig": "\u2019. The hidden state attached to \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.59, "r_y0": 616.96, "r_x1": 476.34, "r_y1": 616.96, "r_x2": 476.34, "r_y2": 608.11, "r_x3": 468.59, "r_y3": 608.11, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.34, "r_y0": 617.18, "r_x1": 545.12, "r_y1": 617.18, "r_x2": 545.12, "r_y2": 608.27, "r_x3": 476.34, "r_y3": 608.27, "coord_origin": "TOPLEFT" }, "text": "\u2019 is passed to the", "orig": "\u2019 is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.13, "r_x1": 545.11, "r_y1": 629.13, "r_x2": 545.11, "r_y2": 620.23, "r_x3": 308.86, "r_y3": 620.23, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.09, "r_x1": 545.12, "r_y1": 641.09, "r_x2": 545.12, "r_y2": 632.18, "r_x3": 308.86, "r_y3": 632.18, "coord_origin": "TOPLEFT" }, "text": "receives the hidden states from the Structure Decoder, to", "orig": "receives the hidden states from the Structure Decoder, to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.04, "r_x1": 545.12, "r_y1": 653.04, "r_x2": 545.12, "r_y2": 644.14, "r_x3": 308.86, "r_y3": 644.14, "coord_origin": "TOPLEFT" }, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.0, "r_x1": 449.42, "r_y1": 665.0, "r_x2": 449.42, "r_y2": 656.09, "r_x3": 308.86, "r_y3": 656.09, "coord_origin": "TOPLEFT" }, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification." }, { "label": "text", "id": 7, "page_no": 3, "cluster": { "id": 7, "label": "text", "bbox": { "l": 308.86, "t": 668.26, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 677.22, "r_x1": 431.91, "r_y1": 677.22, "r_x2": 431.91, "r_y2": 668.26, "r_x3": 320.82, "r_y3": 668.26, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 677.29, "r_x1": 545.11, "r_y1": 677.29, "r_x2": 545.11, "r_y2": 668.38, "r_x3": 439.5, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.11, "r_y1": 689.24, "r_x2": 545.11, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-" } ], "headers": [ { "label": "page_footer", "id": 14, "page_no": 3, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" } ] } }, { "page_no": 4, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 125.63, "r_x1": 84.93, "r_y1": 125.63, "r_x2": 84.93, "r_y2": 122.44, "r_x3": 81.69, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 125.63, "r_x1": 93.03, "r_y1": 125.63, "r_x2": 93.03, "r_y2": 122.44, "r_x3": 86.55, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.5, "r_y0": 118.44, "r_x1": 115.35, "r_y1": 118.44, "r_x2": 115.35, "r_y2": 115.25, "r_x3": 102.5, "r_y3": 115.25, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.14, "r_y0": 118.4, "r_x1": 93.29, "r_y1": 118.4, "r_x2": 93.29, "r_y2": 115.21, "r_x3": 82.14, "r_y3": 115.21, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 125.63, "r_x1": 104.31, "r_y1": 125.63, "r_x2": 104.31, "r_y2": 122.44, "r_x3": 96.75, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 130.93, "r_x1": 102.42, "r_y1": 130.93, "r_x2": 102.42, "r_y2": 127.74, "r_x3": 96.75, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 136.64, "r_x1": 104.31, "r_y1": 136.64, "r_x2": 104.31, "r_y2": 133.46, "r_x3": 96.75, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 142.36, "r_x1": 102.42, "r_y1": 142.36, "r_x2": 102.42, "r_y2": 139.17, "r_x3": 96.75, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 125.63, "r_x1": 116.14, "r_y1": 125.63, "r_x2": 116.14, "r_y2": 122.44, "r_x3": 110.66, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 130.93, "r_x1": 116.14, "r_y1": 130.93, "r_x2": 116.14, "r_y2": 127.74, "r_x3": 110.66, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 136.64, "r_x1": 116.14, "r_y1": 136.64, "r_x2": 116.14, "r_y2": 133.46, "r_x3": 110.66, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 142.36, "r_x1": 116.14, "r_y1": 142.36, "r_x2": 116.14, "r_y2": 139.17, "r_x3": 110.66, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 130.93, "r_x1": 84.93, "r_y1": 130.93, "r_x2": 84.93, "r_y2": 127.74, "r_x3": 81.69, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 130.93, "r_x1": 93.03, "r_y1": 130.93, "r_x2": 93.03, "r_y2": 127.74, "r_x3": 86.55, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 136.64, "r_x1": 84.93, "r_y1": 136.64, "r_x2": 84.93, "r_y2": 133.46, "r_x3": 81.69, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 136.64, "r_x1": 93.03, "r_y1": 136.64, "r_x2": 93.03, "r_y2": 133.46, "r_x3": 86.55, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 142.36, "r_x1": 84.93, "r_y1": 142.36, "r_x2": 84.93, "r_y2": 139.17, "r_x3": 81.69, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 142.36, "r_x1": 93.03, "r_y1": 142.36, "r_x2": 93.03, "r_y2": 139.17, "r_x3": 86.55, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.08, "r_y0": 96.24, "r_x1": 113.94, "r_y1": 96.24, "r_x2": 113.94, "r_y2": 90.5, "r_x3": 88.08, "r_y3": 90.5, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81, "r_y0": 103.38, "r_x1": 119.21, "r_y1": 103.38, "r_x2": 119.21, "r_y2": 97.64, "r_x3": 82.81, "r_y3": 97.64, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94, "r_y0": 106.34, "r_x1": 180.01, "r_y1": 106.34, "r_x2": 180.01, "r_y2": 100.6, "r_x3": 143.94, "r_y3": 100.6, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94, "r_y0": 113.48, "r_x1": 172.01, "r_y1": 113.48, "r_x2": 172.01, "r_y2": 107.74, "r_x3": 151.94, "r_y3": 107.74, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.77, "r_y0": 86.67, "r_x1": 266.4, "r_y1": 86.67, "r_x2": 266.4, "r_y2": 80.93, "r_x3": 251.77, "r_y3": 80.93, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 91.77, "r_x1": 270.65, "r_y1": 91.77, "r_x2": 270.65, "r_y2": 86.03, "r_x3": 247.52, "r_y3": 86.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.04, "r_y0": 84.3, "r_x1": 352.13, "r_y1": 84.3, "r_x2": 352.13, "r_y2": 78.56, "r_x3": 331.04, "r_y3": 78.56, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56, "r_y0": 101.77, "r_x1": 431.73, "r_y1": 101.77, "r_x2": 431.73, "r_y2": 96.03, "r_x3": 390.56, "r_y3": 96.03, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82, "r_y0": 107.89, "r_x1": 435.47, "r_y1": 107.89, "r_x2": 435.47, "r_y2": 102.15, "r_x3": 386.82, "r_y3": 102.15, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 114.01, "r_x1": 433.6, "r_y1": 114.01, "r_x2": 433.6, "r_y2": 108.27, "r_x3": 388.7, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.08, "r_y0": 120.13, "r_x1": 431.23, "r_y1": 120.13, "r_x2": 431.23, "r_y2": 114.39, "r_x3": 391.08, "r_y3": 114.39, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.23, "r_y0": 157.43, "r_x1": 498.82, "r_y1": 157.43, "r_x2": 498.82, "r_y2": 151.69, "r_x3": 431.23, "r_y3": 151.69, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.17, "r_y0": 163.55, "r_x1": 498.88, "r_y1": 163.55, "r_x2": 498.88, "r_y2": 157.81, "r_x3": 431.17, "r_y3": 157.81, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.53, "r_y0": 169.67, "r_x1": 489.52, "r_y1": 169.67, "r_x2": 489.52, "r_y2": 163.93, "r_x3": 440.53, "r_y3": 163.93, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37, "r_y0": 183.99, "r_x1": 367.72, "r_y1": 183.99, "r_x2": 367.72, "r_y2": 178.25, "r_x3": 328.37, "r_y3": 178.25, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 129.65, "r_x1": 373.68, "r_y1": 129.65, "r_x2": 373.68, "r_y2": 123.91, "r_x3": 331.84, "r_y3": 123.91, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 134.75, "r_x1": 381.18, "r_y1": 134.75, "r_x2": 381.18, "r_y2": 129.01, "r_x3": 331.84, "r_y3": 129.01, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.63, "r_y0": 93.86, "r_x1": 219.42, "r_y1": 93.86, "r_x2": 219.42, "r_y2": 88.12, "r_x3": 196.63, "r_y3": 88.12, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.67, "r_y0": 135.24, "r_x1": 271.5, "r_y1": 135.24, "r_x2": 271.5, "r_y2": 129.49, "r_x3": 246.67, "r_y3": 129.49, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 140.34, "r_x1": 270.65, "r_y1": 140.34, "r_x2": 270.65, "r_y2": 134.59, "r_x3": 247.52, "r_y3": 134.59, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 94.76, "r_x1": 365.55, "r_y1": 94.76, "r_x2": 365.55, "r_y2": 89.02, "r_x3": 330.63, "r_y3": 89.02, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 102.92, "r_x1": 370.23, "r_y1": 102.92, "r_x2": 370.23, "r_y2": 97.18, "r_x3": 330.63, "r_y3": 97.18, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 111.08, "r_x1": 374.51, "r_y1": 111.08, "r_x2": 374.51, "r_y2": 105.34, "r_x3": 330.63, "r_y3": 105.34, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 119.24, "r_x1": 335.73, "r_y1": 119.24, "r_x2": 335.73, "r_y2": 113.5, "r_x3": 330.63, "r_y3": 113.5, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 146.58, "r_x1": 335.06, "r_y1": 146.58, "r_x2": 335.06, "r_y2": 141.79, "r_x3": 322.31, "r_y3": 141.79, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 153.72, "r_x1": 335.06, "r_y1": 153.72, "r_x2": 335.06, "r_y2": 148.93, "r_x3": 322.31, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.55, "r_y0": 154.3, "r_x1": 340.95, "r_y1": 154.3, "r_x2": 340.95, "r_y2": 148.56, "r_x3": 337.55, "r_y3": 148.56, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 153.72, "r_x1": 398.91, "r_y1": 153.72, "r_x2": 398.91, "r_y2": 148.93, "r_x3": 343.56, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 153.72, "r_x1": 421.59, "r_y1": 153.72, "r_x2": 421.59, "r_y2": 148.93, "r_x3": 407.42, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 160.86, "r_x1": 349.23, "r_y1": 160.86, "r_x2": 349.23, "r_y2": 156.07, "r_x3": 322.31, "r_y3": 156.07, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 168.0, "r_x1": 335.06, "r_y1": 168.0, "r_x2": 335.06, "r_y2": 163.21, "r_x3": 322.31, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 168.0, "r_x1": 374.74, "r_y1": 168.0, "r_x2": 374.74, "r_y2": 163.21, "r_x3": 343.56, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 175.14, "r_x1": 326.56, "r_y1": 175.14, "r_x2": 326.56, "r_y2": 170.35, "r_x3": 322.31, "r_y3": 170.35, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51, "r_y0": 95.41, "r_x1": 326.91, "r_y1": 95.41, "r_x2": 326.91, "r_y2": 89.67, "r_x3": 323.51, "r_y3": 89.67, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 103.53, "r_x1": 327.12, "r_y1": 103.53, "r_x2": 327.12, "r_y2": 97.79, "r_x3": 323.72, "r_y3": 97.79, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 111.73, "r_x1": 327.12, "r_y1": 111.73, "r_x2": 327.12, "r_y2": 105.99, "r_x3": 323.72, "r_y3": 105.99, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.48, "r_y0": 154.29, "r_x1": 404.88, "r_y1": 154.29, "r_x2": 404.88, "r_y2": 148.55, "r_x3": 401.48, "r_y3": 148.55, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.7, "r_y0": 168.43, "r_x1": 341.1, "r_y1": 168.43, "r_x2": 341.1, "r_y2": 162.68, "r_x3": 337.7, "r_y3": 162.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46, "r_y0": 110.29, "r_x1": 457.87, "r_y1": 110.29, "r_x2": 457.87, "r_y2": 104.55, "r_x3": 454.46, "r_y3": 104.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.33, "r_y0": 96.84, "r_x1": 496.73, "r_y1": 96.84, "r_x2": 496.73, "r_y2": 91.1, "r_x3": 493.33, "r_y3": 91.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08, "r_y0": 96.31, "r_x1": 457.49, "r_y1": 96.31, "r_x2": 457.49, "r_y2": 90.57, "r_x3": 454.08, "r_y3": 90.57, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 213.01, "r_x1": 86.88, "r_y1": 213.01, "r_x2": 86.88, "r_y2": 204.11, "r_x3": 50.11, "r_y3": 204.11, "coord_origin": "TOPLEFT" }, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.02, "r_y0": 212.94, "r_x1": 149.85, "r_y1": 212.94, "r_x2": 149.85, "r_y2": 203.99, "r_x3": 94.02, "r_y3": 203.99, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.86, "r_y0": 213.01, "r_x1": 545.11, "r_y1": 213.01, "r_x2": 545.11, "r_y2": 204.11, "r_x3": 152.86, "r_y3": 204.11, "coord_origin": "TOPLEFT" }, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 224.97, "r_x1": 436.01, "r_y1": 224.97, "r_x2": 436.01, "r_y2": 216.06, "r_x3": 50.11, "r_y3": 216.06, "coord_origin": "TOPLEFT" }, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.25, "r_y0": 264.17, "r_x1": 101.76, "r_y1": 264.17, "r_x2": 101.76, "r_y2": 258.21, "r_x3": 74.25, "r_y3": 258.21, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.3, "r_y0": 264.31, "r_x1": 157.84, "r_y1": 264.31, "r_x2": 157.84, "r_y2": 258.35, "r_x3": 122.3, "r_y3": 258.35, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.55, "r_y0": 377.05, "r_x1": 125.68, "r_y1": 377.05, "r_x2": 125.68, "r_y2": 371.39, "r_x3": 78.55, "r_y3": 371.39, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.51, "r_y0": 396.98, "r_x1": 84.64, "r_y1": 396.98, "r_x2": 84.64, "r_y2": 391.32, "r_x3": 78.51, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.53, "r_y0": 396.98, "r_x1": 125.11, "r_y1": 396.98, "r_x2": 125.11, "r_y2": 391.32, "r_x3": 116.53, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.02, "r_y0": 430.12, "r_x1": 127.92, "r_y1": 430.12, "r_x2": 127.92, "r_y2": 424.45, "r_x3": 76.02, "r_y3": 424.45, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.38, "r_y0": 450.55, "r_x1": 84.51, "r_y1": 450.55, "r_x2": 84.51, "r_y2": 444.89, "r_x3": 78.38, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.4, "r_y0": 450.55, "r_x1": 124.98, "r_y1": 450.55, "r_x2": 124.98, "r_y2": 444.89, "r_x3": 116.4, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.47, "r_y0": 468.11, "r_x1": 181.63, "r_y1": 468.11, "r_x2": 181.63, "r_y2": 462.44, "r_x3": 167.47, "r_y3": 462.44, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61, "r_y0": 484.13, "r_x1": 184.43, "r_y1": 484.13, "r_x2": 184.43, "r_y2": 478.47, "r_x3": 165.61, "r_y3": 478.47, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.32, "r_y0": 330.22, "r_x1": 132.92, "r_y1": 330.22, "r_x2": 132.92, "r_y2": 324.26, "r_x3": 65.32, "r_y3": 324.26, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51, "r_y0": 274.73, "r_x1": 162.99, "r_y1": 274.73, "r_x2": 162.99, "r_y2": 269.66, "r_x3": 119.51, "r_y3": 269.66, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.73, "r_y0": 279.98, "r_x1": 151.41, "r_y1": 279.98, "r_x2": 151.41, "r_y2": 274.91, "r_x3": 128.73, "r_y3": 274.91, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.43, "r_y0": 344.27, "r_x1": 80.27, "r_y1": 344.27, "r_x2": 80.27, "r_y2": 338.96, "r_x3": 60.43, "r_y3": 338.96, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.6, "r_y0": 348.7, "r_x1": 78.85, "r_y1": 348.7, "r_x2": 78.85, "r_y2": 343.39, "r_x3": 60.6, "r_y3": 343.39, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.83, "r_y0": 298.69, "r_x1": 154.66, "r_y1": 298.69, "r_x2": 154.66, "r_y2": 293.38, "r_x3": 134.83, "r_y3": 293.38, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99, "r_y0": 303.11, "r_x1": 153.25, "r_y1": 303.11, "r_x2": 153.25, "r_y2": 297.8, "r_x3": 134.99, "r_y3": 297.8, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 351.02, "r_x1": 197.15, "r_y1": 351.02, "r_x2": 197.15, "r_y2": 345.36, "r_x3": 150.55, "r_y3": 345.36, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 400.09, "r_x1": 156.68, "r_y1": 400.09, "r_x2": 156.68, "r_y2": 394.42, "r_x3": 150.55, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 400.09, "r_x1": 197.15, "r_y1": 400.09, "r_x2": 197.15, "r_y2": 394.42, "r_x3": 188.57, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.19, "r_y0": 381.33, "r_x1": 197.32, "r_y1": 381.33, "r_x2": 197.32, "r_y2": 375.67, "r_x3": 150.19, "r_y3": 375.67, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 445.91, "r_x1": 156.68, "r_y1": 445.91, "r_x2": 156.68, "r_y2": 440.25, "r_x3": 150.55, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 445.91, "r_x1": 197.15, "r_y1": 445.91, "r_x2": 197.15, "r_y2": 440.25, "r_x3": 188.57, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86, "r_y0": 427.76, "r_x1": 199.76, "r_y1": 427.76, "r_x2": 199.76, "r_y2": 422.09, "r_x3": 147.86, "r_y3": 422.09, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.57, "r_y0": 319.92, "r_x1": 255.73, "r_y1": 319.92, "r_x2": 255.73, "r_y2": 314.26, "r_x3": 241.57, "r_y3": 314.26, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.92, "r_y0": 367.03, "r_x1": 256.08, "r_y1": 367.03, "r_x2": 256.08, "r_y2": 361.36, "r_x3": 241.92, "r_y3": 361.36, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.05, "r_y0": 342.28, "r_x1": 248.72, "r_y1": 342.28, "r_x2": 248.72, "r_y2": 336.62, "r_x3": 228.05, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 342.28, "r_x1": 269.39, "r_y1": 342.28, "r_x2": 269.39, "r_y2": 336.62, "r_x3": 246.29, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.45, "r_y0": 410.81, "r_x1": 238.74, "r_y1": 410.81, "r_x2": 238.74, "r_y2": 405.15, "r_x3": 228.45, "r_y3": 405.15, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.3, "r_y0": 410.87, "r_x1": 271.78, "r_y1": 410.87, "r_x2": 271.78, "r_y2": 405.2, "r_x3": 256.3, "r_y3": 405.2, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.55, "r_y0": 387.88, "r_x1": 258.09, "r_y1": 387.88, "r_x2": 258.09, "r_y2": 382.21, "r_x3": 239.55, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.15, "r_y0": 449.78, "r_x1": 59.51, "r_y1": 449.78, "r_x2": 59.51, "r_y2": 384.87, "r_x3": 54.15, "r_y3": 384.87, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.24, "r_y0": 378.45, "r_x1": 59.3, "r_y1": 378.45, "r_x2": 59.3, "r_y2": 373.81, "r_x3": 54.24, "r_y3": 373.81, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.3, "r_y0": 490.37, "r_x1": 122.16, "r_y1": 490.37, "r_x2": 122.16, "r_y2": 484.53, "r_x3": 85.3, "r_y3": 484.53, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.67, "r_y0": 285.46, "r_x1": 265.32, "r_y1": 285.46, "r_x2": 265.32, "r_y2": 279.55, "r_x3": 229.67, "r_y3": 279.55, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17, "r_y0": 506.13, "r_x1": 190.42, "r_y1": 506.13, "r_x2": 190.42, "r_y2": 500.3, "r_x3": 157.17, "r_y3": 500.3, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.82, "r_y0": 443.89, "r_x1": 270.78, "r_y1": 443.89, "r_x2": 270.78, "r_y2": 438.06, "r_x3": 227.82, "r_y3": 438.06, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.7, "r_y0": 449.89, "r_x1": 263.51, "r_y1": 449.89, "r_x2": 263.51, "r_y2": 444.06, "r_x3": 233.7, "r_y3": 444.06, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.75, "r_y0": 298.76, "r_x1": 212.16, "r_y1": 298.76, "r_x2": 212.16, "r_y2": 293.4, "r_x3": 184.75, "r_y3": 293.4, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91, "r_y0": 304.51, "r_x1": 216.74, "r_y1": 304.51, "r_x2": 216.74, "r_y2": 299.15, "r_x3": 178.91, "r_y3": 299.15, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.25, "r_y0": 287.85, "r_x1": 198.89, "r_y1": 287.85, "r_x2": 198.89, "r_y2": 282.78, "r_x3": 194.25, "r_y3": 282.78, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 277.83, "r_x1": 276.47, "r_y1": 277.83, "r_x2": 276.47, "r_y2": 271.87, "r_x3": 221.46, "r_y3": 271.87, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65, "r_y0": 329.1, "r_x1": 197.29, "r_y1": 329.1, "r_x2": 197.29, "r_y2": 323.44, "r_x3": 151.65, "r_y3": 323.44, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43, "r_y0": 335.1, "r_x1": 184.19, "r_y1": 335.1, "r_x2": 184.19, "r_y2": 329.44, "r_x3": 163.43, "r_y3": 329.44, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 536.81, "r_x1": 229.79, "r_y1": 536.81, "r_x2": 229.79, "r_y2": 527.9, "r_x3": 50.11, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "Figure 4: Given an input image of a table, the", "orig": "Figure 4: Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.79, "r_y0": 536.74, "r_x1": 267.76, "r_y1": 536.74, "r_x2": 267.76, "r_y2": 527.78, "r_x3": 231.79, "r_y3": 527.78, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.76, "r_y0": 536.81, "r_x1": 286.36, "r_y1": 536.81, "r_x2": 286.36, "r_y2": 527.9, "r_x3": 269.76, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 548.76, "r_x1": 286.37, "r_y1": 548.76, "r_x2": 286.37, "r_y2": 539.86, "r_x3": 50.11, "r_y3": 539.86, "coord_origin": "TOPLEFT" }, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 560.72, "r_x1": 205.85, "r_y1": 560.72, "r_x2": 205.85, "r_y2": 551.81, "r_x3": 50.11, "r_y3": 551.81, "coord_origin": "TOPLEFT" }, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.02, "r_y0": 560.65, "r_x1": 286.36, "r_y1": 560.65, "r_x2": 286.36, "r_y2": 551.69, "r_x3": 208.02, "r_y3": 551.69, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 572.67, "r_x1": 64.5, "r_y1": 572.67, "r_x2": 64.5, "r_y2": 563.77, "r_x3": 50.11, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.17, "r_y0": 572.61, "r_x1": 151.31, "r_y1": 572.61, "r_x2": 151.31, "r_y2": 563.65, "r_x3": 68.17, "r_y3": 563.65, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.31, "r_y0": 572.67, "r_x1": 153.8, "r_y1": 572.67, "r_x2": 153.8, "r_y2": 563.77, "r_x3": 151.31, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.42, "r_y0": 572.67, "r_x1": 241.93, "r_y1": 572.67, "r_x2": 241.93, "r_y2": 563.77, "r_x3": 160.42, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.6, "r_y0": 572.61, "r_x1": 286.36, "r_y1": 572.61, "r_x2": 286.36, "r_y2": 563.65, "r_x3": 245.6, "r_y3": 563.65, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 584.56, "r_x1": 85.52, "r_y1": 584.56, "r_x2": 85.52, "r_y2": 575.6, "r_x3": 50.11, "r_y3": 575.6, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.62, "r_y0": 584.63, "r_x1": 286.36, "r_y1": 584.63, "r_x2": 286.36, "r_y2": 575.72, "r_x3": 88.62, "r_y3": 575.72, "coord_origin": "TOPLEFT" }, "text": "receives \u2018tokenized tags\u2019 of the HTML code that", "orig": "receives \u2018tokenized tags\u2019 of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 596.58, "r_x1": 286.37, "r_y1": 596.58, "r_x2": 286.37, "r_y2": 587.68, "r_x3": 50.11, "r_y3": 587.68, "coord_origin": "TOPLEFT" }, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 608.54, "r_x1": 286.37, "r_y1": 608.54, "r_x2": 286.37, "r_y2": 599.63, "r_x3": 50.11, "r_y3": 599.63, "coord_origin": "TOPLEFT" }, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 620.49, "r_x1": 240.44, "r_y1": 620.49, "r_x2": 240.44, "r_y2": 611.59, "r_x3": 50.11, "r_y3": 611.59, "coord_origin": "TOPLEFT" }, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.2, "r_y0": 620.43, "r_x1": 286.37, "r_y1": 620.43, "r_x2": 286.37, "r_y2": 611.47, "r_x3": 243.2, "r_y3": 611.47, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 632.38, "r_x1": 286.37, "r_y1": 632.38, "r_x2": 286.37, "r_y2": 623.42, "r_x3": 50.11, "r_y3": 623.42, "coord_origin": "TOPLEFT" }, "text": "Decoder. The linear layer is applied to the features to", "orig": "Decoder. The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 644.34, "r_x1": 286.37, "r_y1": 644.34, "r_x2": 286.37, "r_y2": 635.38, "r_x3": 50.11, "r_y3": 635.38, "coord_origin": "TOPLEFT" }, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 656.36, "r_x1": 220.58, "r_y1": 656.36, "r_x2": 220.58, "r_y2": 647.45, "r_x3": 50.11, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "selects features referring to the data cells (\u2018", "orig": "selects features referring to the data cells (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.58, "r_y0": 656.14, "r_x1": 228.33, "r_y1": 656.14, "r_x2": 228.33, "r_y2": 647.29, "r_x3": 220.58, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.33, "r_y0": 656.36, "r_x1": 236.08, "r_y1": 656.36, "r_x2": 236.08, "r_y2": 647.45, "r_x3": 228.33, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.08, "r_y0": 656.14, "r_x1": 243.83, "r_y1": 656.14, "r_x2": 243.83, "r_y2": 647.29, "r_x3": 236.08, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.83, "r_y0": 656.36, "r_x1": 255.29, "r_y1": 656.36, "r_x2": 255.29, "r_y2": 647.45, "r_x3": 243.83, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018", "orig": "\u2019, \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.29, "r_y0": 656.14, "r_x1": 263.04, "r_y1": 656.14, "r_x2": 263.04, "r_y2": 647.29, "r_x3": 255.29, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.04, "r_y0": 656.36, "r_x1": 286.36, "r_y1": 656.36, "r_x2": 286.36, "r_y2": 647.45, "r_x3": 263.04, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "\u2019) and", "orig": "\u2019) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 668.32, "r_x1": 286.37, "r_y1": 668.32, "r_x2": 286.37, "r_y2": 659.41, "r_x3": 50.11, "r_y3": 659.41, "coord_origin": "TOPLEFT" }, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 680.27, "r_x1": 218.47, "r_y1": 680.27, "r_x2": 218.47, "r_y2": 671.36, "r_x3": 50.11, "r_y3": 671.36, "coord_origin": "TOPLEFT" }, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.44, "r_x1": 523.06, "r_y1": 258.44, "r_x2": 523.06, "r_y2": 249.53, "r_x3": 308.86, "r_y3": 249.53, "coord_origin": "TOPLEFT" }, "text": "forming classification, and adding an adaptive pooling", "orig": "forming classification, and adding an adaptive pooling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.2, "r_y0": 258.44, "r_x1": 545.12, "r_y1": 258.44, "r_x2": 545.12, "r_y2": 249.53, "r_x3": 525.2, "r_y3": 249.53, "coord_origin": "TOPLEFT" }, "text": "layer", "orig": "layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.4, "r_x1": 517.56, "r_y1": 270.4, "r_x2": 517.56, "r_y2": 261.49, "r_x3": 308.86, "r_y3": 261.49, "coord_origin": "TOPLEFT" }, "text": "of size 28*28. ResNet by default downsamples the", "orig": "of size 28*28. ResNet by default downsamples the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 270.4, "r_x1": 545.11, "r_y1": 270.4, "r_x2": 545.11, "r_y2": 261.49, "r_x3": 520.77, "r_y3": 261.49, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.35, "r_x1": 534.8, "r_y1": 282.35, "r_x2": 534.8, "r_y2": 273.45, "r_x3": 308.86, "r_y3": 273.45, "coord_origin": "TOPLEFT" }, "text": "resolution by 32 and then the encoded image is provided", "orig": "resolution by 32 and then the encoded image is provided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.36, "r_y0": 282.35, "r_x1": 545.12, "r_y1": 282.35, "r_x2": 545.12, "r_y2": 273.45, "r_x3": 537.36, "r_y3": 273.45, "coord_origin": "TOPLEFT" }, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.31, "r_x1": 341.24, "r_y1": 294.31, "r_x2": 341.24, "r_y2": 285.4, "r_x3": 308.86, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.73, "r_y0": 294.08, "r_x1": 417.24, "r_y1": 294.08, "r_x2": 417.24, "r_y2": 285.49, "r_x3": 343.73, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.23, "r_y0": 294.31, "r_x1": 436.6, "r_y1": 294.31, "r_x2": 436.6, "r_y2": 285.4, "r_x3": 417.23, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.09, "r_y0": 294.08, "r_x1": 516.56, "r_y1": 294.08, "r_x2": 516.56, "r_y2": 285.49, "r_x3": 439.09, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.56, "r_y0": 294.31, "r_x1": 519.05, "r_y1": 294.31, "r_x2": 519.05, "r_y2": 285.4, "r_x3": 516.56, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 306.3, "r_x1": 400.87, "r_y1": 306.3, "r_x2": 400.87, "r_y2": 297.34, "r_x3": 320.82, "r_y3": 297.34, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.91, "r_y0": 306.37, "r_x1": 528.34, "r_y1": 306.37, "r_x2": 528.34, "r_y2": 297.46, "r_x3": 403.91, "r_y3": 297.46, "coord_origin": "TOPLEFT" }, "text": "The transformer architecture of", "orig": "The transformer architecture of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.72, "r_y0": 306.37, "r_x1": 545.11, "r_y1": 306.37, "r_x2": 545.11, "r_y2": 297.46, "r_x3": 530.72, "r_y3": 297.46, "coord_origin": "TOPLEFT" }, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 318.32, "r_x1": 517.53, "r_y1": 318.32, "r_x2": 517.53, "r_y2": 309.41, "r_x3": 308.86, "r_y3": 309.41, "coord_origin": "TOPLEFT" }, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.09, "r_y0": 318.32, "r_x1": 545.11, "r_y1": 318.32, "r_x2": 545.11, "r_y2": 309.41, "r_x3": 524.09, "r_y3": 309.41, "coord_origin": "TOPLEFT" }, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 330.28, "r_x1": 432.36, "r_y1": 330.28, "r_x2": 432.36, "r_y2": 321.37, "r_x3": 308.86, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.82, "r_y0": 330.05, "r_x1": 510.29, "r_y1": 330.05, "r_x2": 510.29, "r_y2": 321.46, "r_x3": 435.82, "r_y3": 321.46, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.98, "r_y0": 330.28, "r_x1": 520.62, "r_y1": 330.28, "r_x2": 520.62, "r_y2": 321.37, "r_x3": 513.98, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.08, "r_y0": 330.28, "r_x1": 545.11, "r_y1": 330.28, "r_x2": 545.11, "r_y2": 321.37, "r_x3": 524.08, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 342.23, "r_x1": 527.76, "r_y1": 342.23, "r_x2": 527.76, "r_y2": 333.32, "r_x3": 308.86, "r_y3": 333.32, "coord_origin": "TOPLEFT" }, "text": "eled as a transformer encoder with two encoder layers", "orig": "eled as a transformer encoder with two encoder layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.73, "r_y0": 342.23, "r_x1": 545.11, "r_y1": 342.23, "r_x2": 545.11, "r_y2": 333.32, "r_x3": 530.73, "r_y3": 333.32, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 354.19, "r_x1": 526.85, "r_y1": 354.19, "r_x2": 526.85, "r_y2": 345.28, "r_x3": 308.86, "r_y3": 345.28, "coord_origin": "TOPLEFT" }, "text": "a transformer decoder made from a stack of 4 decoder", "orig": "a transformer decoder made from a stack of 4 decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 354.19, "r_x1": 545.11, "r_y1": 354.19, "r_x2": 545.11, "r_y2": 345.28, "r_x3": 529.62, "r_y3": 345.28, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 366.14, "r_x1": 524.51, "r_y1": 366.14, "r_x2": 524.51, "r_y2": 357.24, "r_x3": 308.86, "r_y3": 357.24, "coord_origin": "TOPLEFT" }, "text": "ers that comprise mainly of multi-head attention and", "orig": "ers that comprise mainly of multi-head attention and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.97, "r_y0": 366.14, "r_x1": 545.12, "r_y1": 366.14, "r_x2": 545.12, "r_y2": 357.24, "r_x3": 527.97, "r_y3": 357.24, "coord_origin": "TOPLEFT" }, "text": "feed", "orig": "feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 378.1, "r_x1": 370.39, "r_y1": 378.1, "r_x2": 370.39, "r_y2": 369.19, "r_x3": 308.86, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.44, "r_y0": 378.1, "r_x1": 526.91, "r_y1": 378.1, "r_x2": 526.91, "r_y2": 369.19, "r_x3": 377.44, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "This configuration uses fewer layers", "orig": "This configuration uses fewer layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.73, "r_y0": 378.1, "r_x1": 545.12, "r_y1": 378.1, "r_x2": 545.12, "r_y2": 369.19, "r_x3": 530.73, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 390.05, "r_x1": 505.46, "r_y1": 390.05, "r_x2": 505.46, "r_y2": 381.15, "r_x3": 308.86, "r_y3": 381.15, "coord_origin": "TOPLEFT" }, "text": "heads in comparison to networks applied to other", "orig": "heads in comparison to networks applied to other", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.03, "r_y0": 390.05, "r_x1": 545.12, "r_y1": 390.05, "r_x2": 545.12, "r_y2": 381.15, "r_x3": 508.03, "r_y3": 381.15, "coord_origin": "TOPLEFT" }, "text": "problems", "orig": "problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 402.01, "r_x1": 517.69, "r_y1": 402.01, "r_x2": 517.69, "r_y2": 393.1, "r_x3": 308.86, "r_y3": 393.1, "coord_origin": "TOPLEFT" }, "text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 402.01, "r_x1": 545.11, "r_y1": 402.01, "r_x2": 545.11, "r_y2": 393.1, "r_x3": 520.77, "r_y3": 393.1, "coord_origin": "TOPLEFT" }, "text": "some-", "orig": "some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 413.96, "r_x1": 528.02, "r_y1": 413.96, "r_x2": 528.02, "r_y2": 405.06, "r_x3": 308.86, "r_y3": 405.06, "coord_origin": "TOPLEFT" }, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 426.02, "r_x1": 515.5, "r_y1": 426.02, "r_x2": 515.5, "r_y2": 417.11, "r_x3": 320.82, "r_y3": 417.11, "coord_origin": "TOPLEFT" }, "text": "The transformer encoder receives an encoded", "orig": "The transformer encoder receives an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 426.02, "r_x1": 545.11, "r_y1": 426.02, "r_x2": 545.11, "r_y2": 417.11, "r_x3": 520.77, "r_y3": 417.11, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 437.98, "r_x1": 343.72, "r_y1": 437.98, "r_x2": 343.72, "r_y2": 429.07, "r_x3": 308.86, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.04, "r_y0": 437.75, "r_x1": 446.45, "r_y1": 437.75, "r_x2": 446.45, "r_y2": 429.16, "r_x3": 347.04, "r_y3": 429.16, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.94, "r_y0": 437.98, "r_x1": 503.06, "r_y1": 437.98, "r_x2": 503.06, "r_y2": 429.07, "r_x3": 449.94, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "and refines it", "orig": "and refines it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 506.38, "r_y0": 437.98, "r_x1": 537.37, "r_y1": 437.98, "r_x2": 537.37, "r_y2": 429.07, "r_x3": 506.38, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "through", "orig": "through", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 540.69, "r_y0": 437.98, "r_x1": 545.11, "r_y1": 437.98, "r_x2": 545.11, "r_y2": 429.07, "r_x3": 540.69, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 449.93, "r_x1": 522.79, "r_y1": 449.93, "r_x2": 522.79, "r_y2": 441.02, "r_x3": 308.86, "r_y3": 441.02, "coord_origin": "TOPLEFT" }, "text": "multi-head dot-product attention layer, followed by a", "orig": "multi-head dot-product attention layer, followed by a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.75, "r_y0": 449.93, "r_x1": 545.12, "r_y1": 449.93, "r_x2": 545.12, "r_y2": 441.02, "r_x3": 525.75, "r_y3": 441.02, "coord_origin": "TOPLEFT" }, "text": "Feed", "orig": "Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 461.89, "r_x1": 384.15, "r_y1": 461.89, "r_x2": 384.15, "r_y2": 452.98, "r_x3": 308.86, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.37, "r_y0": 461.89, "r_x1": 527.85, "r_y1": 461.89, "r_x2": 527.85, "r_y2": 452.98, "r_x3": 393.37, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "During training, the transformer", "orig": "During training, the transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.39, "r_y0": 461.89, "r_x1": 545.12, "r_y1": 461.89, "r_x2": 545.12, "r_y2": 452.98, "r_x3": 532.39, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 473.84, "r_x1": 529.76, "r_y1": 473.84, "r_x2": 529.76, "r_y2": 464.94, "r_x3": 308.86, "r_y3": 464.94, "coord_origin": "TOPLEFT" }, "text": "coder receives as input the output feature produced by", "orig": "coder receives as input the output feature produced by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.94, "r_y0": 473.84, "r_x1": 545.12, "r_y1": 473.84, "r_x2": 545.12, "r_y2": 464.94, "r_x3": 532.94, "r_y3": 464.94, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 485.8, "r_x1": 514.17, "r_y1": 485.8, "r_x2": 514.17, "r_y2": 476.89, "r_x3": 308.86, "r_y3": 476.89, "coord_origin": "TOPLEFT" }, "text": "transformer encoder, and the tokenized input of the", "orig": "transformer encoder, and the tokenized input of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.89, "r_y0": 485.8, "r_x1": 545.12, "r_y1": 485.8, "r_x2": 545.12, "r_y2": 476.89, "r_x3": 516.89, "r_y3": 476.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.75, "r_x1": 527.63, "r_y1": 497.75, "r_x2": 527.63, "r_y2": 488.85, "r_x3": 308.86, "r_y3": 488.85, "coord_origin": "TOPLEFT" }, "text": "ground-truth tags. Using a stack of multi-head attention", "orig": "ground-truth tags. Using a stack of multi-head attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 497.75, "r_x1": 545.11, "r_y1": 497.75, "r_x2": 545.11, "r_y2": 488.85, "r_x3": 529.62, "r_y3": 488.85, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.71, "r_x1": 508.36, "r_y1": 509.71, "r_x2": 508.36, "r_y2": 500.8, "r_x3": 308.86, "r_y3": 500.8, "coord_origin": "TOPLEFT" }, "text": "ers, different aspects of the tag sequence could be", "orig": "ers, different aspects of the tag sequence could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.09, "r_y0": 509.71, "r_x1": 545.12, "r_y1": 509.71, "r_x2": 545.12, "r_y2": 500.8, "r_x3": 511.09, "r_y3": 500.8, "coord_origin": "TOPLEFT" }, "text": "inferred.", "orig": "inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.66, "r_x1": 545.11, "r_y1": 521.66, "r_x2": 545.11, "r_y2": 512.76, "r_x3": 308.86, "r_y3": 512.76, "coord_origin": "TOPLEFT" }, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.62, "r_x1": 545.12, "r_y1": 533.62, "r_x2": 545.12, "r_y2": 524.71, "r_x3": 308.86, "r_y3": 524.71, "coord_origin": "TOPLEFT" }, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.57, "r_x1": 369.73, "r_y1": 545.57, "r_x2": 369.73, "r_y2": 536.67, "r_x3": 308.86, "r_y3": 536.67, "coord_origin": "TOPLEFT" }, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 557.56, "r_x1": 404.76, "r_y1": 557.56, "r_x2": 404.76, "r_y2": 548.6, "r_x3": 320.82, "r_y3": 548.6, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.34, "r_y0": 557.63, "r_x1": 545.12, "r_y1": 557.63, "r_x2": 545.12, "r_y2": 548.72, "r_x3": 410.34, "r_y3": 548.72, "coord_origin": "TOPLEFT" }, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.59, "r_x1": 545.11, "r_y1": 569.59, "r_x2": 545.11, "r_y2": 560.68, "r_x3": 308.86, "r_y3": 560.68, "coord_origin": "TOPLEFT" }, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.54, "r_x1": 545.12, "r_y1": 581.54, "r_x2": 545.12, "r_y2": 572.64, "r_x3": 308.86, "r_y3": 572.64, "coord_origin": "TOPLEFT" }, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.5, "r_x1": 545.11, "r_y1": 593.5, "r_x2": 545.11, "r_y2": 584.59, "r_x3": 308.86, "r_y3": 584.59, "coord_origin": "TOPLEFT" }, "text": "to end. This approach is inspired by DETR [1] which em-", "orig": "to end. This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.45, "r_x1": 545.11, "r_y1": 605.45, "r_x2": 545.11, "r_y2": 596.55, "r_x3": 308.86, "r_y3": 596.55, "coord_origin": "TOPLEFT" }, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.41, "r_x1": 545.12, "r_y1": 617.41, "r_x2": 545.12, "r_y2": 608.5, "r_x3": 308.86, "r_y3": 608.5, "coord_origin": "TOPLEFT" }, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.36, "r_x1": 545.12, "r_y1": 629.36, "r_x2": 545.12, "r_y2": 620.46, "r_x3": 308.86, "r_y3": 620.46, "coord_origin": "TOPLEFT" }, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.32, "r_x1": 381.68, "r_y1": 641.32, "r_x2": 381.68, "r_y2": 632.41, "r_x3": 308.86, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0, "r_y0": 641.1, "r_x1": 391.75, "r_y1": 641.1, "r_x2": 391.75, "r_y2": 632.25, "r_x3": 384.0, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.75, "r_y0": 641.32, "r_x1": 399.5, "r_y1": 641.32, "r_x2": 399.5, "r_y2": 632.41, "r_x3": 391.75, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 399.5, "r_y0": 641.1, "r_x1": 407.25, "r_y1": 641.1, "r_x2": 407.25, "r_y2": 632.25, "r_x3": 399.5, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.25, "r_y0": 641.32, "r_x1": 432.91, "r_y1": 641.32, "r_x2": 432.91, "r_y2": 632.41, "r_x3": 407.25, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "\u2019 and \u2018", "orig": "\u2019 and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.91, "r_y0": 641.1, "r_x1": 440.66, "r_y1": 641.1, "r_x2": 440.66, "r_y2": 632.25, "r_x3": 432.91, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.66, "r_y0": 641.32, "r_x1": 545.11, "r_y1": 641.32, "r_x2": 545.11, "r_y2": 632.41, "r_x3": 440.66, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "\u2019 HTML structure tags be-", "orig": "\u2019 HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.27, "r_x1": 398.96, "r_y1": 653.27, "r_x2": 398.96, "r_y2": 644.37, "r_x3": 308.86, "r_y3": 644.37, "coord_origin": "TOPLEFT" }, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 665.33, "r_x1": 444.34, "r_y1": 665.33, "r_x2": 444.34, "r_y2": 656.43, "r_x3": 320.82, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 447.01, "r_y0": 665.1, "r_x1": 545.11, "r_y1": 665.1, "r_x2": 545.11, "r_y2": 656.51, "r_x3": 447.01, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.12, "r_y1": 677.29, "r_x2": 545.12, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "provide an attention weighted encoding. This weighted at-", "orig": "provide an attention weighted encoding. This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "picture", "bbox": { "l": 74.31, "t": 77.91, "r": 519.98, "b": 183.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 125.63, "r_x1": 84.93, "r_y1": 125.63, "r_x2": 84.93, "r_y2": 122.44, "r_x3": 81.69, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 125.63, "r_x1": 93.03, "r_y1": 125.63, "r_x2": 93.03, "r_y2": 122.44, "r_x3": 86.55, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.5, "r_y0": 118.44, "r_x1": 115.35, "r_y1": 118.44, "r_x2": 115.35, "r_y2": 115.25, "r_x3": 102.5, "r_y3": 115.25, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.14, "r_y0": 118.4, "r_x1": 93.29, "r_y1": 118.4, "r_x2": 93.29, "r_y2": 115.21, "r_x3": 82.14, "r_y3": 115.21, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 125.63, "r_x1": 104.31, "r_y1": 125.63, "r_x2": 104.31, "r_y2": 122.44, "r_x3": 96.75, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 130.93, "r_x1": 102.42, "r_y1": 130.93, "r_x2": 102.42, "r_y2": 127.74, "r_x3": 96.75, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 136.64, "r_x1": 104.31, "r_y1": 136.64, "r_x2": 104.31, "r_y2": 133.46, "r_x3": 96.75, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 142.36, "r_x1": 102.42, "r_y1": 142.36, "r_x2": 102.42, "r_y2": 139.17, "r_x3": 96.75, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 125.63, "r_x1": 116.14, "r_y1": 125.63, "r_x2": 116.14, "r_y2": 122.44, "r_x3": 110.66, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 130.93, "r_x1": 116.14, "r_y1": 130.93, "r_x2": 116.14, "r_y2": 127.74, "r_x3": 110.66, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 136.64, "r_x1": 116.14, "r_y1": 136.64, "r_x2": 116.14, "r_y2": 133.46, "r_x3": 110.66, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 142.36, "r_x1": 116.14, "r_y1": 142.36, "r_x2": 116.14, "r_y2": 139.17, "r_x3": 110.66, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 130.93, "r_x1": 84.93, "r_y1": 130.93, "r_x2": 84.93, "r_y2": 127.74, "r_x3": 81.69, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 130.93, "r_x1": 93.03, "r_y1": 130.93, "r_x2": 93.03, "r_y2": 127.74, "r_x3": 86.55, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 136.64, "r_x1": 84.93, "r_y1": 136.64, "r_x2": 84.93, "r_y2": 133.46, "r_x3": 81.69, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 136.64, "r_x1": 93.03, "r_y1": 136.64, "r_x2": 93.03, "r_y2": 133.46, "r_x3": 86.55, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 142.36, "r_x1": 84.93, "r_y1": 142.36, "r_x2": 84.93, "r_y2": 139.17, "r_x3": 81.69, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 142.36, "r_x1": 93.03, "r_y1": 142.36, "r_x2": 93.03, "r_y2": 139.17, "r_x3": 86.55, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.08, "r_y0": 96.24, "r_x1": 113.94, "r_y1": 96.24, "r_x2": 113.94, "r_y2": 90.5, "r_x3": 88.08, "r_y3": 90.5, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81, "r_y0": 103.38, "r_x1": 119.21, "r_y1": 103.38, "r_x2": 119.21, "r_y2": 97.64, "r_x3": 82.81, "r_y3": 97.64, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94, "r_y0": 106.34, "r_x1": 180.01, "r_y1": 106.34, "r_x2": 180.01, "r_y2": 100.6, "r_x3": 143.94, "r_y3": 100.6, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94, "r_y0": 113.48, "r_x1": 172.01, "r_y1": 113.48, "r_x2": 172.01, "r_y2": 107.74, "r_x3": 151.94, "r_y3": 107.74, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.77, "r_y0": 86.67, "r_x1": 266.4, "r_y1": 86.67, "r_x2": 266.4, "r_y2": 80.93, "r_x3": 251.77, "r_y3": 80.93, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 91.77, "r_x1": 270.65, "r_y1": 91.77, "r_x2": 270.65, "r_y2": 86.03, "r_x3": 247.52, "r_y3": 86.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.04, "r_y0": 84.3, "r_x1": 352.13, "r_y1": 84.3, "r_x2": 352.13, "r_y2": 78.56, "r_x3": 331.04, "r_y3": 78.56, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56, "r_y0": 101.77, "r_x1": 431.73, "r_y1": 101.77, "r_x2": 431.73, "r_y2": 96.03, "r_x3": 390.56, "r_y3": 96.03, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82, "r_y0": 107.89, "r_x1": 435.47, "r_y1": 107.89, "r_x2": 435.47, "r_y2": 102.15, "r_x3": 386.82, "r_y3": 102.15, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 114.01, "r_x1": 433.6, "r_y1": 114.01, "r_x2": 433.6, "r_y2": 108.27, "r_x3": 388.7, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.08, "r_y0": 120.13, "r_x1": 431.23, "r_y1": 120.13, "r_x2": 431.23, "r_y2": 114.39, "r_x3": 391.08, "r_y3": 114.39, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.23, "r_y0": 157.43, "r_x1": 498.82, "r_y1": 157.43, "r_x2": 498.82, "r_y2": 151.69, "r_x3": 431.23, "r_y3": 151.69, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.17, "r_y0": 163.55, "r_x1": 498.88, "r_y1": 163.55, "r_x2": 498.88, "r_y2": 157.81, "r_x3": 431.17, "r_y3": 157.81, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.53, "r_y0": 169.67, "r_x1": 489.52, "r_y1": 169.67, "r_x2": 489.52, "r_y2": 163.93, "r_x3": 440.53, "r_y3": 163.93, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37, "r_y0": 183.99, "r_x1": 367.72, "r_y1": 183.99, "r_x2": 367.72, "r_y2": 178.25, "r_x3": 328.37, "r_y3": 178.25, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 129.65, "r_x1": 373.68, "r_y1": 129.65, "r_x2": 373.68, "r_y2": 123.91, "r_x3": 331.84, "r_y3": 123.91, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 134.75, "r_x1": 381.18, "r_y1": 134.75, "r_x2": 381.18, "r_y2": 129.01, "r_x3": 331.84, "r_y3": 129.01, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.63, "r_y0": 93.86, "r_x1": 219.42, "r_y1": 93.86, "r_x2": 219.42, "r_y2": 88.12, "r_x3": 196.63, "r_y3": 88.12, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.67, "r_y0": 135.24, "r_x1": 271.5, "r_y1": 135.24, "r_x2": 271.5, "r_y2": 129.49, "r_x3": 246.67, "r_y3": 129.49, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 140.34, "r_x1": 270.65, "r_y1": 140.34, "r_x2": 270.65, "r_y2": 134.59, "r_x3": 247.52, "r_y3": 134.59, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 94.76, "r_x1": 365.55, "r_y1": 94.76, "r_x2": 365.55, "r_y2": 89.02, "r_x3": 330.63, "r_y3": 89.02, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 102.92, "r_x1": 370.23, "r_y1": 102.92, "r_x2": 370.23, "r_y2": 97.18, "r_x3": 330.63, "r_y3": 97.18, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 111.08, "r_x1": 374.51, "r_y1": 111.08, "r_x2": 374.51, "r_y2": 105.34, "r_x3": 330.63, "r_y3": 105.34, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 119.24, "r_x1": 335.73, "r_y1": 119.24, "r_x2": 335.73, "r_y2": 113.5, "r_x3": 330.63, "r_y3": 113.5, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 146.58, "r_x1": 335.06, "r_y1": 146.58, "r_x2": 335.06, "r_y2": 141.79, "r_x3": 322.31, "r_y3": 141.79, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 153.72, "r_x1": 335.06, "r_y1": 153.72, "r_x2": 335.06, "r_y2": 148.93, "r_x3": 322.31, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.55, "r_y0": 154.3, "r_x1": 340.95, "r_y1": 154.3, "r_x2": 340.95, "r_y2": 148.56, "r_x3": 337.55, "r_y3": 148.56, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 153.72, "r_x1": 398.91, "r_y1": 153.72, "r_x2": 398.91, "r_y2": 148.93, "r_x3": 343.56, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 153.72, "r_x1": 421.59, "r_y1": 153.72, "r_x2": 421.59, "r_y2": 148.93, "r_x3": 407.42, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 160.86, "r_x1": 349.23, "r_y1": 160.86, "r_x2": 349.23, "r_y2": 156.07, "r_x3": 322.31, "r_y3": 156.07, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 168.0, "r_x1": 335.06, "r_y1": 168.0, "r_x2": 335.06, "r_y2": 163.21, "r_x3": 322.31, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 168.0, "r_x1": 374.74, "r_y1": 168.0, "r_x2": 374.74, "r_y2": 163.21, "r_x3": 343.56, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 175.14, "r_x1": 326.56, "r_y1": 175.14, "r_x2": 326.56, "r_y2": 170.35, "r_x3": 322.31, "r_y3": 170.35, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51, "r_y0": 95.41, "r_x1": 326.91, "r_y1": 95.41, "r_x2": 326.91, "r_y2": 89.67, "r_x3": 323.51, "r_y3": 89.67, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 103.53, "r_x1": 327.12, "r_y1": 103.53, "r_x2": 327.12, "r_y2": 97.79, "r_x3": 323.72, "r_y3": 97.79, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 111.73, "r_x1": 327.12, "r_y1": 111.73, "r_x2": 327.12, "r_y2": 105.99, "r_x3": 323.72, "r_y3": 105.99, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.48, "r_y0": 154.29, "r_x1": 404.88, "r_y1": 154.29, "r_x2": 404.88, "r_y2": 148.55, "r_x3": 401.48, "r_y3": 148.55, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.7, "r_y0": 168.43, "r_x1": 341.1, "r_y1": 168.43, "r_x2": 341.1, "r_y2": 162.68, "r_x3": 337.7, "r_y3": 162.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46, "r_y0": 110.29, "r_x1": 457.87, "r_y1": 110.29, "r_x2": 457.87, "r_y2": 104.55, "r_x3": 454.46, "r_y3": 104.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.33, "r_y0": 96.84, "r_x1": 496.73, "r_y1": 96.84, "r_x2": 496.73, "r_y2": 91.1, "r_x3": 493.33, "r_y3": 91.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08, "r_y0": 96.31, "r_x1": 457.49, "r_y1": 96.31, "r_x2": 457.49, "r_y2": 90.57, "r_x3": 454.08, "r_y3": 90.57, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 81.69, "t": 122.44, "r": 84.93, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 125.63, "r_x1": 84.93, "r_y1": 125.63, "r_x2": 84.93, "r_y2": 122.44, "r_x3": 81.69, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 86.55, "t": 122.44, "r": 93.03, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 125.63, "r_x1": 93.03, "r_y1": 125.63, "r_x2": 93.03, "r_y2": 122.44, "r_x3": 86.55, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 102.5, "t": 115.25, "r": 115.35, "b": 118.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.5, "r_y0": 118.44, "r_x1": 115.35, "r_y1": 118.44, "r_x2": 115.35, "r_y2": 115.25, "r_x3": 102.5, "r_y3": 115.25, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 82.14, "t": 115.21, "r": 93.29, "b": 118.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.14, "r_y0": 118.4, "r_x1": 93.29, "r_y1": 118.4, "r_x2": 93.29, "r_y2": 115.21, "r_x3": 82.14, "r_y3": 115.21, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 96.75, "t": 122.44, "r": 104.31, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 125.63, "r_x1": 104.31, "r_y1": 125.63, "r_x2": 104.31, "r_y2": 122.44, "r_x3": 96.75, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 96.75, "t": 127.74, "r": 102.42, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 130.93, "r_x1": 102.42, "r_y1": 130.93, "r_x2": 102.42, "r_y2": 127.74, "r_x3": 96.75, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 96.75, "t": 133.46, "r": 104.31, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 136.64, "r_x1": 104.31, "r_y1": 136.64, "r_x2": 104.31, "r_y2": 133.46, "r_x3": 96.75, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 96.75, "t": 139.17, "r": 102.42, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 142.36, "r_x1": 102.42, "r_y1": 142.36, "r_x2": 102.42, "r_y2": 139.17, "r_x3": 96.75, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 110.66, "t": 122.44, "r": 116.14, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 125.63, "r_x1": 116.14, "r_y1": 125.63, "r_x2": 116.14, "r_y2": 122.44, "r_x3": 110.66, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 110.66, "t": 127.74, "r": 116.14, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 130.93, "r_x1": 116.14, "r_y1": 130.93, "r_x2": 116.14, "r_y2": 127.74, "r_x3": 110.66, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 110.66, "t": 133.46, "r": 116.14, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 136.64, "r_x1": 116.14, "r_y1": 136.64, "r_x2": 116.14, "r_y2": 133.46, "r_x3": 110.66, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 110.66, "t": 139.17, "r": 116.14, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 142.36, "r_x1": 116.14, "r_y1": 142.36, "r_x2": 116.14, "r_y2": 139.17, "r_x3": 110.66, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 81.69, "t": 127.74, "r": 84.93, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 130.93, "r_x1": 84.93, "r_y1": 130.93, "r_x2": 84.93, "r_y2": 127.74, "r_x3": 81.69, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 86.55, "t": 127.74, "r": 93.03, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 130.93, "r_x1": 93.03, "r_y1": 130.93, "r_x2": 93.03, "r_y2": 127.74, "r_x3": 86.55, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 81.69, "t": 133.46, "r": 84.93, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 136.64, "r_x1": 84.93, "r_y1": 136.64, "r_x2": 84.93, "r_y2": 133.46, "r_x3": 81.69, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 86.55, "t": 133.46, "r": 93.03, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 136.64, "r_x1": 93.03, "r_y1": 136.64, "r_x2": 93.03, "r_y2": 133.46, "r_x3": 86.55, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 81.69, "t": 139.17, "r": 84.93, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 142.36, "r_x1": 84.93, "r_y1": 142.36, "r_x2": 84.93, "r_y2": 139.17, "r_x3": 81.69, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 86.55, "t": 139.17, "r": 93.03, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 142.36, "r_x1": 93.03, "r_y1": 142.36, "r_x2": 93.03, "r_y2": 139.17, "r_x3": 86.55, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 88.08, "t": 90.5, "r": 113.94, "b": 96.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.08, "r_y0": 96.24, "r_x1": 113.94, "r_y1": 96.24, "r_x2": 113.94, "r_y2": 90.5, "r_x3": 88.08, "r_y3": 90.5, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 82.81, "t": 97.64, "r": 119.21, "b": 103.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81, "r_y0": 103.38, "r_x1": 119.21, "r_y1": 103.38, "r_x2": 119.21, "r_y2": 97.64, "r_x3": 82.81, "r_y3": 97.64, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 143.94, "t": 100.6, "r": 180.01, "b": 106.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94, "r_y0": 106.34, "r_x1": 180.01, "r_y1": 106.34, "r_x2": 180.01, "r_y2": 100.6, "r_x3": 143.94, "r_y3": 100.6, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 151.94, "t": 107.74, "r": 172.01, "b": 113.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94, "r_y0": 113.48, "r_x1": 172.01, "r_y1": 113.48, "r_x2": 172.01, "r_y2": 107.74, "r_x3": 151.94, "r_y3": 107.74, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 251.77, "t": 80.93, "r": 266.4, "b": 86.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.77, "r_y0": 86.67, "r_x1": 266.4, "r_y1": 86.67, "r_x2": 266.4, "r_y2": 80.93, "r_x3": 251.77, "r_y3": 80.93, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 247.52, "t": 86.03, "r": 270.65, "b": 91.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 91.77, "r_x1": 270.65, "r_y1": 91.77, "r_x2": 270.65, "r_y2": 86.03, "r_x3": 247.52, "r_y3": 86.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 331.04, "t": 78.56, "r": 352.13, "b": 84.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.04, "r_y0": 84.3, "r_x1": 352.13, "r_y1": 84.3, "r_x2": 352.13, "r_y2": 78.56, "r_x3": 331.04, "r_y3": 78.56, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 390.56, "t": 96.03, "r": 431.73, "b": 101.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56, "r_y0": 101.77, "r_x1": 431.73, "r_y1": 101.77, "r_x2": 431.73, "r_y2": 96.03, "r_x3": 390.56, "r_y3": 96.03, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 386.82, "t": 102.15, "r": 435.47, "b": 107.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82, "r_y0": 107.89, "r_x1": 435.47, "r_y1": 107.89, "r_x2": 435.47, "r_y2": 102.15, "r_x3": 386.82, "r_y3": 102.15, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 388.7, "t": 108.27, "r": 433.6, "b": 114.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 114.01, "r_x1": 433.6, "r_y1": 114.01, "r_x2": 433.6, "r_y2": 108.27, "r_x3": 388.7, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 391.08, "t": 114.39, "r": 431.23, "b": 120.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.08, "r_y0": 120.13, "r_x1": 431.23, "r_y1": 120.13, "r_x2": 431.23, "r_y2": 114.39, "r_x3": 391.08, "r_y3": 114.39, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 431.23, "t": 151.69, "r": 498.82, "b": 157.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.23, "r_y0": 157.43, "r_x1": 498.82, "r_y1": 157.43, "r_x2": 498.82, "r_y2": 151.69, "r_x3": 431.23, "r_y3": 151.69, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 431.17, "t": 157.81, "r": 498.88, "b": 163.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.17, "r_y0": 163.55, "r_x1": 498.88, "r_y1": 163.55, "r_x2": 498.88, "r_y2": 157.81, "r_x3": 431.17, "r_y3": 157.81, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 440.53, "t": 163.93, "r": 489.52, "b": 169.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.53, "r_y0": 169.67, "r_x1": 489.52, "r_y1": 169.67, "r_x2": 489.52, "r_y2": 163.93, "r_x3": 440.53, "r_y3": 163.93, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 328.37, "t": 178.25, "r": 367.72, "b": 183.99, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37, "r_y0": 183.99, "r_x1": 367.72, "r_y1": 183.99, "r_x2": 367.72, "r_y2": 178.25, "r_x3": 328.37, "r_y3": 178.25, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 331.84, "t": 123.91, "r": 373.68, "b": 129.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 129.65, "r_x1": 373.68, "r_y1": 129.65, "r_x2": 373.68, "r_y2": 123.91, "r_x3": 331.84, "r_y3": 123.91, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 331.84, "t": 129.01, "r": 381.18, "b": 134.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 134.75, "r_x1": 381.18, "r_y1": 134.75, "r_x2": 381.18, "r_y2": 129.01, "r_x3": 331.84, "r_y3": 129.01, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 196.63, "t": 88.12, "r": 219.42, "b": 93.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.63, "r_y0": 93.86, "r_x1": 219.42, "r_y1": 93.86, "r_x2": 219.42, "r_y2": 88.12, "r_x3": 196.63, "r_y3": 88.12, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 246.67, "t": 129.49, "r": 271.5, "b": 135.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.67, "r_y0": 135.24, "r_x1": 271.5, "r_y1": 135.24, "r_x2": 271.5, "r_y2": 129.49, "r_x3": 246.67, "r_y3": 129.49, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 247.52, "t": 134.59, "r": 270.65, "b": 140.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 140.34, "r_x1": 270.65, "r_y1": 140.34, "r_x2": 270.65, "r_y2": 134.59, "r_x3": 247.52, "r_y3": 134.59, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 330.63, "t": 89.02, "r": 365.55, "b": 94.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 94.76, "r_x1": 365.55, "r_y1": 94.76, "r_x2": 365.55, "r_y2": 89.02, "r_x3": 330.63, "r_y3": 89.02, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 330.63, "t": 97.18, "r": 370.23, "b": 102.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 102.92, "r_x1": 370.23, "r_y1": 102.92, "r_x2": 370.23, "r_y2": 97.18, "r_x3": 330.63, "r_y3": 97.18, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 330.63, "t": 105.34, "r": 374.51, "b": 111.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 111.08, "r_x1": 374.51, "r_y1": 111.08, "r_x2": 374.51, "r_y2": 105.34, "r_x3": 330.63, "r_y3": 105.34, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 330.63, "t": 113.5, "r": 335.73, "b": 119.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 119.24, "r_x1": 335.73, "r_y1": 119.24, "r_x2": 335.73, "r_y2": 113.5, "r_x3": 330.63, "r_y3": 113.5, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 322.31, "t": 141.79, "r": 335.06, "b": 146.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 146.58, "r_x1": 335.06, "r_y1": 146.58, "r_x2": 335.06, "r_y2": 141.79, "r_x3": 322.31, "r_y3": 141.79, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 322.31, "t": 148.93, "r": 335.06, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 153.72, "r_x1": 335.06, "r_y1": 153.72, "r_x2": 335.06, "r_y2": 148.93, "r_x3": 322.31, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 337.55, "t": 148.56, "r": 340.95, "b": 154.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.55, "r_y0": 154.3, "r_x1": 340.95, "r_y1": 154.3, "r_x2": 340.95, "r_y2": 148.56, "r_x3": 337.55, "r_y3": 148.56, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 343.56, "t": 148.93, "r": 398.91, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 153.72, "r_x1": 398.91, "r_y1": 153.72, "r_x2": 398.91, "r_y2": 148.93, "r_x3": 343.56, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 407.42, "t": 148.93, "r": 421.59, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 153.72, "r_x1": 421.59, "r_y1": 153.72, "r_x2": 421.59, "r_y2": 148.93, "r_x3": 407.42, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 322.31, "t": 156.07, "r": 349.23, "b": 160.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 160.86, "r_x1": 349.23, "r_y1": 160.86, "r_x2": 349.23, "r_y2": 156.07, "r_x3": 322.31, "r_y3": 156.07, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 322.31, "t": 163.21, "r": 335.06, "b": 168.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 168.0, "r_x1": 335.06, "r_y1": 168.0, "r_x2": 335.06, "r_y2": 163.21, "r_x3": 322.31, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 343.56, "t": 163.21, "r": 374.74, "b": 168.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 168.0, "r_x1": 374.74, "r_y1": 168.0, "r_x2": 374.74, "r_y2": 163.21, "r_x3": 343.56, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 322.31, "t": 170.35, "r": 326.56, "b": 175.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 175.14, "r_x1": 326.56, "r_y1": 175.14, "r_x2": 326.56, "r_y2": 170.35, "r_x3": 322.31, "r_y3": 170.35, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 323.51, "t": 89.67, "r": 326.91, "b": 95.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51, "r_y0": 95.41, "r_x1": 326.91, "r_y1": 95.41, "r_x2": 326.91, "r_y2": 89.67, "r_x3": 323.51, "r_y3": 89.67, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 323.72, "t": 97.79, "r": 327.12, "b": 103.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 103.53, "r_x1": 327.12, "r_y1": 103.53, "r_x2": 327.12, "r_y2": 97.79, "r_x3": 323.72, "r_y3": 97.79, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 323.72, "t": 105.99, "r": 327.12, "b": 111.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 111.73, "r_x1": 327.12, "r_y1": 111.73, "r_x2": 327.12, "r_y2": 105.99, "r_x3": 323.72, "r_y3": 105.99, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 401.48, "t": 148.55, "r": 404.88, "b": 154.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.48, "r_y0": 154.29, "r_x1": 404.88, "r_y1": 154.29, "r_x2": 404.88, "r_y2": 148.55, "r_x3": 401.48, "r_y3": 148.55, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 337.7, "t": 162.68, "r": 341.1, "b": 168.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.7, "r_y0": 168.43, "r_x1": 341.1, "r_y1": 168.43, "r_x2": 341.1, "r_y2": 162.68, "r_x3": 337.7, "r_y3": 162.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 454.46, "t": 104.55, "r": 457.87, "b": 110.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46, "r_y0": 110.29, "r_x1": 457.87, "r_y1": 110.29, "r_x2": 457.87, "r_y2": 104.55, "r_x3": 454.46, "r_y3": 104.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 493.33, "t": 91.1, "r": 496.73, "b": 96.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.33, "r_y0": 96.84, "r_x1": 496.73, "r_y1": 96.84, "r_x2": 496.73, "r_y2": 91.1, "r_x3": 493.33, "r_y3": 91.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 454.08, "t": 90.57, "r": 457.49, "b": 96.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08, "r_y0": 96.31, "r_x1": 457.49, "r_y1": 96.31, "r_x2": 457.49, "r_y2": 90.57, "r_x3": 454.08, "r_y3": 90.57, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 6, "label": "caption", "bbox": { "l": 50.11, "t": 203.99, "r": 545.11, "b": 224.97, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 213.01, "r_x1": 86.88, "r_y1": 213.01, "r_x2": 86.88, "r_y2": 204.11, "r_x3": 50.11, "r_y3": 204.11, "coord_origin": "TOPLEFT" }, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.02, "r_y0": 212.94, "r_x1": 149.85, "r_y1": 212.94, "r_x2": 149.85, "r_y2": 203.99, "r_x3": 94.02, "r_y3": 203.99, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.86, "r_y0": 213.01, "r_x1": 545.11, "r_y1": 213.01, "r_x2": 545.11, "r_y2": 204.11, "r_x3": 152.86, "r_y3": 204.11, "coord_origin": "TOPLEFT" }, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 224.97, "r_x1": 436.01, "r_y1": 224.97, "r_x2": 436.01, "r_y2": 216.06, "r_x3": 50.11, "r_y3": 216.06, "coord_origin": "TOPLEFT" }, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "picture", "bbox": { "l": 53.03, "t": 257.67, "r": 285.37, "b": 507.67, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.25, "r_y0": 264.17, "r_x1": 101.76, "r_y1": 264.17, "r_x2": 101.76, "r_y2": 258.21, "r_x3": 74.25, "r_y3": 258.21, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.3, "r_y0": 264.31, "r_x1": 157.84, "r_y1": 264.31, "r_x2": 157.84, "r_y2": 258.35, "r_x3": 122.3, "r_y3": 258.35, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.55, "r_y0": 377.05, "r_x1": 125.68, "r_y1": 377.05, "r_x2": 125.68, "r_y2": 371.39, "r_x3": 78.55, "r_y3": 371.39, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.51, "r_y0": 396.98, "r_x1": 84.64, "r_y1": 396.98, "r_x2": 84.64, "r_y2": 391.32, "r_x3": 78.51, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.53, "r_y0": 396.98, "r_x1": 125.11, "r_y1": 396.98, "r_x2": 125.11, "r_y2": 391.32, "r_x3": 116.53, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.02, "r_y0": 430.12, "r_x1": 127.92, "r_y1": 430.12, "r_x2": 127.92, "r_y2": 424.45, "r_x3": 76.02, "r_y3": 424.45, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.38, "r_y0": 450.55, "r_x1": 84.51, "r_y1": 450.55, "r_x2": 84.51, "r_y2": 444.89, "r_x3": 78.38, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.4, "r_y0": 450.55, "r_x1": 124.98, "r_y1": 450.55, "r_x2": 124.98, "r_y2": 444.89, "r_x3": 116.4, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.47, "r_y0": 468.11, "r_x1": 181.63, "r_y1": 468.11, "r_x2": 181.63, "r_y2": 462.44, "r_x3": 167.47, "r_y3": 462.44, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61, "r_y0": 484.13, "r_x1": 184.43, "r_y1": 484.13, "r_x2": 184.43, "r_y2": 478.47, "r_x3": 165.61, "r_y3": 478.47, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.32, "r_y0": 330.22, "r_x1": 132.92, "r_y1": 330.22, "r_x2": 132.92, "r_y2": 324.26, "r_x3": 65.32, "r_y3": 324.26, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51, "r_y0": 274.73, "r_x1": 162.99, "r_y1": 274.73, "r_x2": 162.99, "r_y2": 269.66, "r_x3": 119.51, "r_y3": 269.66, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.73, "r_y0": 279.98, "r_x1": 151.41, "r_y1": 279.98, "r_x2": 151.41, "r_y2": 274.91, "r_x3": 128.73, "r_y3": 274.91, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.43, "r_y0": 344.27, "r_x1": 80.27, "r_y1": 344.27, "r_x2": 80.27, "r_y2": 338.96, "r_x3": 60.43, "r_y3": 338.96, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.6, "r_y0": 348.7, "r_x1": 78.85, "r_y1": 348.7, "r_x2": 78.85, "r_y2": 343.39, "r_x3": 60.6, "r_y3": 343.39, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.83, "r_y0": 298.69, "r_x1": 154.66, "r_y1": 298.69, "r_x2": 154.66, "r_y2": 293.38, "r_x3": 134.83, "r_y3": 293.38, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99, "r_y0": 303.11, "r_x1": 153.25, "r_y1": 303.11, "r_x2": 153.25, "r_y2": 297.8, "r_x3": 134.99, "r_y3": 297.8, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 351.02, "r_x1": 197.15, "r_y1": 351.02, "r_x2": 197.15, "r_y2": 345.36, "r_x3": 150.55, "r_y3": 345.36, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 400.09, "r_x1": 156.68, "r_y1": 400.09, "r_x2": 156.68, "r_y2": 394.42, "r_x3": 150.55, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 400.09, "r_x1": 197.15, "r_y1": 400.09, "r_x2": 197.15, "r_y2": 394.42, "r_x3": 188.57, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.19, "r_y0": 381.33, "r_x1": 197.32, "r_y1": 381.33, "r_x2": 197.32, "r_y2": 375.67, "r_x3": 150.19, "r_y3": 375.67, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 445.91, "r_x1": 156.68, "r_y1": 445.91, "r_x2": 156.68, "r_y2": 440.25, "r_x3": 150.55, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 445.91, "r_x1": 197.15, "r_y1": 445.91, "r_x2": 197.15, "r_y2": 440.25, "r_x3": 188.57, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86, "r_y0": 427.76, "r_x1": 199.76, "r_y1": 427.76, "r_x2": 199.76, "r_y2": 422.09, "r_x3": 147.86, "r_y3": 422.09, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.57, "r_y0": 319.92, "r_x1": 255.73, "r_y1": 319.92, "r_x2": 255.73, "r_y2": 314.26, "r_x3": 241.57, "r_y3": 314.26, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.92, "r_y0": 367.03, "r_x1": 256.08, "r_y1": 367.03, "r_x2": 256.08, "r_y2": 361.36, "r_x3": 241.92, "r_y3": 361.36, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.05, "r_y0": 342.28, "r_x1": 248.72, "r_y1": 342.28, "r_x2": 248.72, "r_y2": 336.62, "r_x3": 228.05, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 342.28, "r_x1": 269.39, "r_y1": 342.28, "r_x2": 269.39, "r_y2": 336.62, "r_x3": 246.29, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.45, "r_y0": 410.81, "r_x1": 238.74, "r_y1": 410.81, "r_x2": 238.74, "r_y2": 405.15, "r_x3": 228.45, "r_y3": 405.15, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.3, "r_y0": 410.87, "r_x1": 271.78, "r_y1": 410.87, "r_x2": 271.78, "r_y2": 405.2, "r_x3": 256.3, "r_y3": 405.2, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.55, "r_y0": 387.88, "r_x1": 258.09, "r_y1": 387.88, "r_x2": 258.09, "r_y2": 382.21, "r_x3": 239.55, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.15, "r_y0": 449.78, "r_x1": 59.51, "r_y1": 449.78, "r_x2": 59.51, "r_y2": 384.87, "r_x3": 54.15, "r_y3": 384.87, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.24, "r_y0": 378.45, "r_x1": 59.3, "r_y1": 378.45, "r_x2": 59.3, "r_y2": 373.81, "r_x3": 54.24, "r_y3": 373.81, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.3, "r_y0": 490.37, "r_x1": 122.16, "r_y1": 490.37, "r_x2": 122.16, "r_y2": 484.53, "r_x3": 85.3, "r_y3": 484.53, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.67, "r_y0": 285.46, "r_x1": 265.32, "r_y1": 285.46, "r_x2": 265.32, "r_y2": 279.55, "r_x3": 229.67, "r_y3": 279.55, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17, "r_y0": 506.13, "r_x1": 190.42, "r_y1": 506.13, "r_x2": 190.42, "r_y2": 500.3, "r_x3": 157.17, "r_y3": 500.3, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.82, "r_y0": 443.89, "r_x1": 270.78, "r_y1": 443.89, "r_x2": 270.78, "r_y2": 438.06, "r_x3": 227.82, "r_y3": 438.06, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.7, "r_y0": 449.89, "r_x1": 263.51, "r_y1": 449.89, "r_x2": 263.51, "r_y2": 444.06, "r_x3": 233.7, "r_y3": 444.06, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.75, "r_y0": 298.76, "r_x1": 212.16, "r_y1": 298.76, "r_x2": 212.16, "r_y2": 293.4, "r_x3": 184.75, "r_y3": 293.4, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91, "r_y0": 304.51, "r_x1": 216.74, "r_y1": 304.51, "r_x2": 216.74, "r_y2": 299.15, "r_x3": 178.91, "r_y3": 299.15, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.25, "r_y0": 287.85, "r_x1": 198.89, "r_y1": 287.85, "r_x2": 198.89, "r_y2": 282.78, "r_x3": 194.25, "r_y3": 282.78, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 277.83, "r_x1": 276.47, "r_y1": 277.83, "r_x2": 276.47, "r_y2": 271.87, "r_x3": 221.46, "r_y3": 271.87, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65, "r_y0": 329.1, "r_x1": 197.29, "r_y1": 329.1, "r_x2": 197.29, "r_y2": 323.44, "r_x3": 151.65, "r_y3": 323.44, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43, "r_y0": 335.1, "r_x1": 184.19, "r_y1": 335.1, "r_x2": 184.19, "r_y2": 329.44, "r_x3": 163.43, "r_y3": 329.44, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 70, "label": "text", "bbox": { "l": 74.25, "t": 258.21, "r": 101.76, "b": 264.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.25, "r_y0": 264.17, "r_x1": 101.76, "r_y1": 264.17, "r_x2": 101.76, "r_y2": 258.21, "r_x3": 74.25, "r_y3": 258.21, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 122.3, "t": 258.35, "r": 157.84, "b": 264.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.3, "r_y0": 264.31, "r_x1": 157.84, "r_y1": 264.31, "r_x2": 157.84, "r_y2": 258.35, "r_x3": 122.3, "r_y3": 258.35, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 78.55, "t": 371.39, "r": 125.68, "b": 377.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.55, "r_y0": 377.05, "r_x1": 125.68, "r_y1": 377.05, "r_x2": 125.68, "r_y2": 371.39, "r_x3": 78.55, "r_y3": 371.39, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 78.51, "t": 391.32, "r": 84.64, "b": 396.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.51, "r_y0": 396.98, "r_x1": 84.64, "r_y1": 396.98, "r_x2": 84.64, "r_y2": 391.32, "r_x3": 78.51, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 116.53, "t": 391.32, "r": 125.11, "b": 396.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.53, "r_y0": 396.98, "r_x1": 125.11, "r_y1": 396.98, "r_x2": 125.11, "r_y2": 391.32, "r_x3": 116.53, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 76.02, "t": 424.45, "r": 127.92, "b": 430.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.02, "r_y0": 430.12, "r_x1": 127.92, "r_y1": 430.12, "r_x2": 127.92, "r_y2": 424.45, "r_x3": 76.02, "r_y3": 424.45, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 78.38, "t": 444.89, "r": 84.51, "b": 450.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.38, "r_y0": 450.55, "r_x1": 84.51, "r_y1": 450.55, "r_x2": 84.51, "r_y2": 444.89, "r_x3": 78.38, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 116.4, "t": 444.89, "r": 124.98, "b": 450.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.4, "r_y0": 450.55, "r_x1": 124.98, "r_y1": 450.55, "r_x2": 124.98, "r_y2": 444.89, "r_x3": 116.4, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 167.47, "t": 462.44, "r": 181.63, "b": 468.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.47, "r_y0": 468.11, "r_x1": 181.63, "r_y1": 468.11, "r_x2": 181.63, "r_y2": 462.44, "r_x3": 167.47, "r_y3": 462.44, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 165.61, "t": 478.47, "r": 184.43, "b": 484.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61, "r_y0": 484.13, "r_x1": 184.43, "r_y1": 484.13, "r_x2": 184.43, "r_y2": 478.47, "r_x3": 165.61, "r_y3": 478.47, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 65.32, "t": 324.26, "r": 132.92, "b": 330.22, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.32, "r_y0": 330.22, "r_x1": 132.92, "r_y1": 330.22, "r_x2": 132.92, "r_y2": 324.26, "r_x3": 65.32, "r_y3": 324.26, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 119.51, "t": 269.66, "r": 162.99, "b": 274.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51, "r_y0": 274.73, "r_x1": 162.99, "r_y1": 274.73, "r_x2": 162.99, "r_y2": 269.66, "r_x3": 119.51, "r_y3": 269.66, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 128.73, "t": 274.91, "r": 151.41, "b": 279.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.73, "r_y0": 279.98, "r_x1": 151.41, "r_y1": 279.98, "r_x2": 151.41, "r_y2": 274.91, "r_x3": 128.73, "r_y3": 274.91, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 60.43, "t": 338.96, "r": 80.27, "b": 344.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.43, "r_y0": 344.27, "r_x1": 80.27, "r_y1": 344.27, "r_x2": 80.27, "r_y2": 338.96, "r_x3": 60.43, "r_y3": 338.96, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 60.6, "t": 343.39, "r": 78.85, "b": 348.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.6, "r_y0": 348.7, "r_x1": 78.85, "r_y1": 348.7, "r_x2": 78.85, "r_y2": 343.39, "r_x3": 60.6, "r_y3": 343.39, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 134.83, "t": 293.38, "r": 154.66, "b": 298.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.83, "r_y0": 298.69, "r_x1": 154.66, "r_y1": 298.69, "r_x2": 154.66, "r_y2": 293.38, "r_x3": 134.83, "r_y3": 293.38, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 134.99, "t": 297.8, "r": 153.25, "b": 303.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99, "r_y0": 303.11, "r_x1": 153.25, "r_y1": 303.11, "r_x2": 153.25, "r_y2": 297.8, "r_x3": 134.99, "r_y3": 297.8, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 150.55, "t": 345.36, "r": 197.15, "b": 351.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 351.02, "r_x1": 197.15, "r_y1": 351.02, "r_x2": 197.15, "r_y2": 345.36, "r_x3": 150.55, "r_y3": 345.36, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 150.55, "t": 394.42, "r": 156.68, "b": 400.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 400.09, "r_x1": 156.68, "r_y1": 400.09, "r_x2": 156.68, "r_y2": 394.42, "r_x3": 150.55, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 188.57, "t": 394.42, "r": 197.15, "b": 400.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 400.09, "r_x1": 197.15, "r_y1": 400.09, "r_x2": 197.15, "r_y2": 394.42, "r_x3": 188.57, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 150.19, "t": 375.67, "r": 197.32, "b": 381.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.19, "r_y0": 381.33, "r_x1": 197.32, "r_y1": 381.33, "r_x2": 197.32, "r_y2": 375.67, "r_x3": 150.19, "r_y3": 375.67, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 150.55, "t": 440.25, "r": 156.68, "b": 445.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 445.91, "r_x1": 156.68, "r_y1": 445.91, "r_x2": 156.68, "r_y2": 440.25, "r_x3": 150.55, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 188.57, "t": 440.25, "r": 197.15, "b": 445.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 445.91, "r_x1": 197.15, "r_y1": 445.91, "r_x2": 197.15, "r_y2": 440.25, "r_x3": 188.57, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 147.86, "t": 422.09, "r": 199.76, "b": 427.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86, "r_y0": 427.76, "r_x1": 199.76, "r_y1": 427.76, "r_x2": 199.76, "r_y2": 422.09, "r_x3": 147.86, "r_y3": 422.09, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 241.57, "t": 314.26, "r": 255.73, "b": 319.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.57, "r_y0": 319.92, "r_x1": 255.73, "r_y1": 319.92, "r_x2": 255.73, "r_y2": 314.26, "r_x3": 241.57, "r_y3": 314.26, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 241.92, "t": 361.36, "r": 256.08, "b": 367.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.92, "r_y0": 367.03, "r_x1": 256.08, "r_y1": 367.03, "r_x2": 256.08, "r_y2": 361.36, "r_x3": 241.92, "r_y3": 361.36, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 228.05, "t": 336.62, "r": 248.72, "b": 342.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.05, "r_y0": 342.28, "r_x1": 248.72, "r_y1": 342.28, "r_x2": 248.72, "r_y2": 336.62, "r_x3": 228.05, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 246.29, "t": 336.62, "r": 269.39, "b": 342.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 342.28, "r_x1": 269.39, "r_y1": 342.28, "r_x2": 269.39, "r_y2": 336.62, "r_x3": 246.29, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 228.45, "t": 405.15, "r": 238.74, "b": 410.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.45, "r_y0": 410.81, "r_x1": 238.74, "r_y1": 410.81, "r_x2": 238.74, "r_y2": 405.15, "r_x3": 228.45, "r_y3": 405.15, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 256.3, "t": 405.2, "r": 271.78, "b": 410.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.3, "r_y0": 410.87, "r_x1": 271.78, "r_y1": 410.87, "r_x2": 271.78, "r_y2": 405.2, "r_x3": 256.3, "r_y3": 405.2, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 239.55, "t": 382.21, "r": 258.09, "b": 387.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.55, "r_y0": 387.88, "r_x1": 258.09, "r_y1": 387.88, "r_x2": 258.09, "r_y2": 382.21, "r_x3": 239.55, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 54.15, "t": 384.87, "r": 59.51, "b": 449.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.15, "r_y0": 449.78, "r_x1": 59.51, "r_y1": 449.78, "r_x2": 59.51, "r_y2": 384.87, "r_x3": 54.15, "r_y3": 384.87, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 54.24, "t": 373.81, "r": 59.3, "b": 378.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.24, "r_y0": 378.45, "r_x1": 59.3, "r_y1": 378.45, "r_x2": 59.3, "r_y2": 373.81, "r_x3": 54.24, "r_y3": 373.81, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 85.3, "t": 484.53, "r": 122.16, "b": 490.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.3, "r_y0": 490.37, "r_x1": 122.16, "r_y1": 490.37, "r_x2": 122.16, "r_y2": 484.53, "r_x3": 85.3, "r_y3": 484.53, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 229.67, "t": 279.55, "r": 265.32, "b": 285.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.67, "r_y0": 285.46, "r_x1": 265.32, "r_y1": 285.46, "r_x2": 265.32, "r_y2": 279.55, "r_x3": 229.67, "r_y3": 279.55, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 157.17, "t": 500.3, "r": 190.42, "b": 506.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17, "r_y0": 506.13, "r_x1": 190.42, "r_y1": 506.13, "r_x2": 190.42, "r_y2": 500.3, "r_x3": 157.17, "r_y3": 500.3, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 227.82, "t": 438.06, "r": 270.78, "b": 443.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.82, "r_y0": 443.89, "r_x1": 270.78, "r_y1": 443.89, "r_x2": 270.78, "r_y2": 438.06, "r_x3": 227.82, "r_y3": 438.06, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 233.7, "t": 444.06, "r": 263.51, "b": 449.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.7, "r_y0": 449.89, "r_x1": 263.51, "r_y1": 449.89, "r_x2": 263.51, "r_y2": 444.06, "r_x3": 233.7, "r_y3": 444.06, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 184.75, "t": 293.4, "r": 212.16, "b": 298.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.75, "r_y0": 298.76, "r_x1": 212.16, "r_y1": 298.76, "r_x2": 212.16, "r_y2": 293.4, "r_x3": 184.75, "r_y3": 293.4, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 178.91, "t": 299.15, "r": 216.74, "b": 304.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91, "r_y0": 304.51, "r_x1": 216.74, "r_y1": 304.51, "r_x2": 216.74, "r_y2": 299.15, "r_x3": 178.91, "r_y3": 299.15, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 194.25, "t": 282.78, "r": 198.89, "b": 287.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.25, "r_y0": 287.85, "r_x1": 198.89, "r_y1": 287.85, "r_x2": 198.89, "r_y2": 282.78, "r_x3": 194.25, "r_y3": 282.78, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 221.46, "t": 271.87, "r": 276.47, "b": 277.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 277.83, "r_x1": 276.47, "r_y1": 277.83, "r_x2": 276.47, "r_y2": 271.87, "r_x3": 221.46, "r_y3": 271.87, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 151.65, "t": 323.44, "r": 197.29, "b": 329.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65, "r_y0": 329.1, "r_x1": 197.29, "r_y1": 329.1, "r_x2": 197.29, "r_y2": 323.44, "r_x3": 151.65, "r_y3": 323.44, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 163.43, "t": 329.44, "r": 184.19, "b": 335.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43, "r_y0": 335.1, "r_x1": 184.19, "r_y1": 335.1, "r_x2": 184.19, "r_y2": 329.44, "r_x3": 163.43, "r_y3": 329.44, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 8, "label": "caption", "bbox": { "l": 50.11, "t": 527.78, "r": 286.37, "b": 680.27, "coord_origin": "TOPLEFT" }, "confidence": 0.891, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 536.81, "r_x1": 229.79, "r_y1": 536.81, "r_x2": 229.79, "r_y2": 527.9, "r_x3": 50.11, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "Figure 4: Given an input image of a table, the", "orig": "Figure 4: Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.79, "r_y0": 536.74, "r_x1": 267.76, "r_y1": 536.74, "r_x2": 267.76, "r_y2": 527.78, "r_x3": 231.79, "r_y3": 527.78, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.76, "r_y0": 536.81, "r_x1": 286.36, "r_y1": 536.81, "r_x2": 286.36, "r_y2": 527.9, "r_x3": 269.76, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 548.76, "r_x1": 286.37, "r_y1": 548.76, "r_x2": 286.37, "r_y2": 539.86, "r_x3": 50.11, "r_y3": 539.86, "coord_origin": "TOPLEFT" }, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 560.72, "r_x1": 205.85, "r_y1": 560.72, "r_x2": 205.85, "r_y2": 551.81, "r_x3": 50.11, "r_y3": 551.81, "coord_origin": "TOPLEFT" }, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.02, "r_y0": 560.65, "r_x1": 286.36, "r_y1": 560.65, "r_x2": 286.36, "r_y2": 551.69, "r_x3": 208.02, "r_y3": 551.69, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 572.67, "r_x1": 64.5, "r_y1": 572.67, "r_x2": 64.5, "r_y2": 563.77, "r_x3": 50.11, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.17, "r_y0": 572.61, "r_x1": 151.31, "r_y1": 572.61, "r_x2": 151.31, "r_y2": 563.65, "r_x3": 68.17, "r_y3": 563.65, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.31, "r_y0": 572.67, "r_x1": 153.8, "r_y1": 572.67, "r_x2": 153.8, "r_y2": 563.77, "r_x3": 151.31, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.42, "r_y0": 572.67, "r_x1": 241.93, "r_y1": 572.67, "r_x2": 241.93, "r_y2": 563.77, "r_x3": 160.42, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.6, "r_y0": 572.61, "r_x1": 286.36, "r_y1": 572.61, "r_x2": 286.36, "r_y2": 563.65, "r_x3": 245.6, "r_y3": 563.65, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 584.56, "r_x1": 85.52, "r_y1": 584.56, "r_x2": 85.52, "r_y2": 575.6, "r_x3": 50.11, "r_y3": 575.6, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.62, "r_y0": 584.63, "r_x1": 286.36, "r_y1": 584.63, "r_x2": 286.36, "r_y2": 575.72, "r_x3": 88.62, "r_y3": 575.72, "coord_origin": "TOPLEFT" }, "text": "receives \u2018tokenized tags\u2019 of the HTML code that", "orig": "receives \u2018tokenized tags\u2019 of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 596.58, "r_x1": 286.37, "r_y1": 596.58, "r_x2": 286.37, "r_y2": 587.68, "r_x3": 50.11, "r_y3": 587.68, "coord_origin": "TOPLEFT" }, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 608.54, "r_x1": 286.37, "r_y1": 608.54, "r_x2": 286.37, "r_y2": 599.63, "r_x3": 50.11, "r_y3": 599.63, "coord_origin": "TOPLEFT" }, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 620.49, "r_x1": 240.44, "r_y1": 620.49, "r_x2": 240.44, "r_y2": 611.59, "r_x3": 50.11, "r_y3": 611.59, "coord_origin": "TOPLEFT" }, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.2, "r_y0": 620.43, "r_x1": 286.37, "r_y1": 620.43, "r_x2": 286.37, "r_y2": 611.47, "r_x3": 243.2, "r_y3": 611.47, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 632.38, "r_x1": 286.37, "r_y1": 632.38, "r_x2": 286.37, "r_y2": 623.42, "r_x3": 50.11, "r_y3": 623.42, "coord_origin": "TOPLEFT" }, "text": "Decoder. The linear layer is applied to the features to", "orig": "Decoder. The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 644.34, "r_x1": 286.37, "r_y1": 644.34, "r_x2": 286.37, "r_y2": 635.38, "r_x3": 50.11, "r_y3": 635.38, "coord_origin": "TOPLEFT" }, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 656.36, "r_x1": 220.58, "r_y1": 656.36, "r_x2": 220.58, "r_y2": 647.45, "r_x3": 50.11, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "selects features referring to the data cells (\u2018", "orig": "selects features referring to the data cells (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.58, "r_y0": 656.14, "r_x1": 228.33, "r_y1": 656.14, "r_x2": 228.33, "r_y2": 647.29, "r_x3": 220.58, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.33, "r_y0": 656.36, "r_x1": 236.08, "r_y1": 656.36, "r_x2": 236.08, "r_y2": 647.45, "r_x3": 228.33, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.08, "r_y0": 656.14, "r_x1": 243.83, "r_y1": 656.14, "r_x2": 243.83, "r_y2": 647.29, "r_x3": 236.08, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.83, "r_y0": 656.36, "r_x1": 255.29, "r_y1": 656.36, "r_x2": 255.29, "r_y2": 647.45, "r_x3": 243.83, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018", "orig": "\u2019, \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.29, "r_y0": 656.14, "r_x1": 263.04, "r_y1": 656.14, "r_x2": 263.04, "r_y2": 647.29, "r_x3": 255.29, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.04, "r_y0": 656.36, "r_x1": 286.36, "r_y1": 656.36, "r_x2": 286.36, "r_y2": 647.45, "r_x3": 263.04, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "\u2019) and", "orig": "\u2019) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 668.32, "r_x1": 286.37, "r_y1": 668.32, "r_x2": 286.37, "r_y2": 659.41, "r_x3": 50.11, "r_y3": 659.41, "coord_origin": "TOPLEFT" }, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 680.27, "r_x1": 218.47, "r_y1": 680.27, "r_x2": 218.47, "r_y2": 671.36, "r_x3": 50.11, "r_y3": 671.36, "coord_origin": "TOPLEFT" }, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 249.53, "r": 545.12, "b": 294.31, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.44, "r_x1": 523.06, "r_y1": 258.44, "r_x2": 523.06, "r_y2": 249.53, "r_x3": 308.86, "r_y3": 249.53, "coord_origin": "TOPLEFT" }, "text": "forming classification, and adding an adaptive pooling", "orig": "forming classification, and adding an adaptive pooling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.2, "r_y0": 258.44, "r_x1": 545.12, "r_y1": 258.44, "r_x2": 545.12, "r_y2": 249.53, "r_x3": 525.2, "r_y3": 249.53, "coord_origin": "TOPLEFT" }, "text": "layer", "orig": "layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.4, "r_x1": 517.56, "r_y1": 270.4, "r_x2": 517.56, "r_y2": 261.49, "r_x3": 308.86, "r_y3": 261.49, "coord_origin": "TOPLEFT" }, "text": "of size 28*28. ResNet by default downsamples the", "orig": "of size 28*28. ResNet by default downsamples the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 270.4, "r_x1": 545.11, "r_y1": 270.4, "r_x2": 545.11, "r_y2": 261.49, "r_x3": 520.77, "r_y3": 261.49, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.35, "r_x1": 534.8, "r_y1": 282.35, "r_x2": 534.8, "r_y2": 273.45, "r_x3": 308.86, "r_y3": 273.45, "coord_origin": "TOPLEFT" }, "text": "resolution by 32 and then the encoded image is provided", "orig": "resolution by 32 and then the encoded image is provided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.36, "r_y0": 282.35, "r_x1": 545.12, "r_y1": 282.35, "r_x2": 545.12, "r_y2": 273.45, "r_x3": 537.36, "r_y3": 273.45, "coord_origin": "TOPLEFT" }, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.31, "r_x1": 341.24, "r_y1": 294.31, "r_x2": 341.24, "r_y2": 285.4, "r_x3": 308.86, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.73, "r_y0": 294.08, "r_x1": 417.24, "r_y1": 294.08, "r_x2": 417.24, "r_y2": 285.49, "r_x3": 343.73, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.23, "r_y0": 294.31, "r_x1": 436.6, "r_y1": 294.31, "r_x2": 436.6, "r_y2": 285.4, "r_x3": 417.23, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.09, "r_y0": 294.08, "r_x1": 516.56, "r_y1": 294.08, "r_x2": 516.56, "r_y2": 285.49, "r_x3": 439.09, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.56, "r_y0": 294.31, "r_x1": 519.05, "r_y1": 294.31, "r_x2": 519.05, "r_y2": 285.4, "r_x3": 516.56, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 297.34, "r": 545.12, "b": 413.96, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 306.3, "r_x1": 400.87, "r_y1": 306.3, "r_x2": 400.87, "r_y2": 297.34, "r_x3": 320.82, "r_y3": 297.34, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.91, "r_y0": 306.37, "r_x1": 528.34, "r_y1": 306.37, "r_x2": 528.34, "r_y2": 297.46, "r_x3": 403.91, "r_y3": 297.46, "coord_origin": "TOPLEFT" }, "text": "The transformer architecture of", "orig": "The transformer architecture of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.72, "r_y0": 306.37, "r_x1": 545.11, "r_y1": 306.37, "r_x2": 545.11, "r_y2": 297.46, "r_x3": 530.72, "r_y3": 297.46, "coord_origin": "TOPLEFT" }, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 318.32, "r_x1": 517.53, "r_y1": 318.32, "r_x2": 517.53, "r_y2": 309.41, "r_x3": 308.86, "r_y3": 309.41, "coord_origin": "TOPLEFT" }, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.09, "r_y0": 318.32, "r_x1": 545.11, "r_y1": 318.32, "r_x2": 545.11, "r_y2": 309.41, "r_x3": 524.09, "r_y3": 309.41, "coord_origin": "TOPLEFT" }, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 330.28, "r_x1": 432.36, "r_y1": 330.28, "r_x2": 432.36, "r_y2": 321.37, "r_x3": 308.86, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.82, "r_y0": 330.05, "r_x1": 510.29, "r_y1": 330.05, "r_x2": 510.29, "r_y2": 321.46, "r_x3": 435.82, "r_y3": 321.46, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.98, "r_y0": 330.28, "r_x1": 520.62, "r_y1": 330.28, "r_x2": 520.62, "r_y2": 321.37, "r_x3": 513.98, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.08, "r_y0": 330.28, "r_x1": 545.11, "r_y1": 330.28, "r_x2": 545.11, "r_y2": 321.37, "r_x3": 524.08, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 342.23, "r_x1": 527.76, "r_y1": 342.23, "r_x2": 527.76, "r_y2": 333.32, "r_x3": 308.86, "r_y3": 333.32, "coord_origin": "TOPLEFT" }, "text": "eled as a transformer encoder with two encoder layers", "orig": "eled as a transformer encoder with two encoder layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.73, "r_y0": 342.23, "r_x1": 545.11, "r_y1": 342.23, "r_x2": 545.11, "r_y2": 333.32, "r_x3": 530.73, "r_y3": 333.32, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 354.19, "r_x1": 526.85, "r_y1": 354.19, "r_x2": 526.85, "r_y2": 345.28, "r_x3": 308.86, "r_y3": 345.28, "coord_origin": "TOPLEFT" }, "text": "a transformer decoder made from a stack of 4 decoder", "orig": "a transformer decoder made from a stack of 4 decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 354.19, "r_x1": 545.11, "r_y1": 354.19, "r_x2": 545.11, "r_y2": 345.28, "r_x3": 529.62, "r_y3": 345.28, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 366.14, "r_x1": 524.51, "r_y1": 366.14, "r_x2": 524.51, "r_y2": 357.24, "r_x3": 308.86, "r_y3": 357.24, "coord_origin": "TOPLEFT" }, "text": "ers that comprise mainly of multi-head attention and", "orig": "ers that comprise mainly of multi-head attention and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.97, "r_y0": 366.14, "r_x1": 545.12, "r_y1": 366.14, "r_x2": 545.12, "r_y2": 357.24, "r_x3": 527.97, "r_y3": 357.24, "coord_origin": "TOPLEFT" }, "text": "feed", "orig": "feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 378.1, "r_x1": 370.39, "r_y1": 378.1, "r_x2": 370.39, "r_y2": 369.19, "r_x3": 308.86, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.44, "r_y0": 378.1, "r_x1": 526.91, "r_y1": 378.1, "r_x2": 526.91, "r_y2": 369.19, "r_x3": 377.44, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "This configuration uses fewer layers", "orig": "This configuration uses fewer layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.73, "r_y0": 378.1, "r_x1": 545.12, "r_y1": 378.1, "r_x2": 545.12, "r_y2": 369.19, "r_x3": 530.73, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 390.05, "r_x1": 505.46, "r_y1": 390.05, "r_x2": 505.46, "r_y2": 381.15, "r_x3": 308.86, "r_y3": 381.15, "coord_origin": "TOPLEFT" }, "text": "heads in comparison to networks applied to other", "orig": "heads in comparison to networks applied to other", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.03, "r_y0": 390.05, "r_x1": 545.12, "r_y1": 390.05, "r_x2": 545.12, "r_y2": 381.15, "r_x3": 508.03, "r_y3": 381.15, "coord_origin": "TOPLEFT" }, "text": "problems", "orig": "problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 402.01, "r_x1": 517.69, "r_y1": 402.01, "r_x2": 517.69, "r_y2": 393.1, "r_x3": 308.86, "r_y3": 393.1, "coord_origin": "TOPLEFT" }, "text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 402.01, "r_x1": 545.11, "r_y1": 402.01, "r_x2": 545.11, "r_y2": 393.1, "r_x3": 520.77, "r_y3": 393.1, "coord_origin": "TOPLEFT" }, "text": "some-", "orig": "some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 413.96, "r_x1": 528.02, "r_y1": 413.96, "r_x2": 528.02, "r_y2": 405.06, "r_x3": 308.86, "r_y3": 405.06, "coord_origin": "TOPLEFT" }, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 417.11, "r": 545.12, "b": 545.57, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 426.02, "r_x1": 515.5, "r_y1": 426.02, "r_x2": 515.5, "r_y2": 417.11, "r_x3": 320.82, "r_y3": 417.11, "coord_origin": "TOPLEFT" }, "text": "The transformer encoder receives an encoded", "orig": "The transformer encoder receives an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 426.02, "r_x1": 545.11, "r_y1": 426.02, "r_x2": 545.11, "r_y2": 417.11, "r_x3": 520.77, "r_y3": 417.11, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 437.98, "r_x1": 343.72, "r_y1": 437.98, "r_x2": 343.72, "r_y2": 429.07, "r_x3": 308.86, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.04, "r_y0": 437.75, "r_x1": 446.45, "r_y1": 437.75, "r_x2": 446.45, "r_y2": 429.16, "r_x3": 347.04, "r_y3": 429.16, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.94, "r_y0": 437.98, "r_x1": 503.06, "r_y1": 437.98, "r_x2": 503.06, "r_y2": 429.07, "r_x3": 449.94, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "and refines it", "orig": "and refines it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 506.38, "r_y0": 437.98, "r_x1": 537.37, "r_y1": 437.98, "r_x2": 537.37, "r_y2": 429.07, "r_x3": 506.38, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "through", "orig": "through", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 540.69, "r_y0": 437.98, "r_x1": 545.11, "r_y1": 437.98, "r_x2": 545.11, "r_y2": 429.07, "r_x3": 540.69, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 449.93, "r_x1": 522.79, "r_y1": 449.93, "r_x2": 522.79, "r_y2": 441.02, "r_x3": 308.86, "r_y3": 441.02, "coord_origin": "TOPLEFT" }, "text": "multi-head dot-product attention layer, followed by a", "orig": "multi-head dot-product attention layer, followed by a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.75, "r_y0": 449.93, "r_x1": 545.12, "r_y1": 449.93, "r_x2": 545.12, "r_y2": 441.02, "r_x3": 525.75, "r_y3": 441.02, "coord_origin": "TOPLEFT" }, "text": "Feed", "orig": "Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 461.89, "r_x1": 384.15, "r_y1": 461.89, "r_x2": 384.15, "r_y2": 452.98, "r_x3": 308.86, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.37, "r_y0": 461.89, "r_x1": 527.85, "r_y1": 461.89, "r_x2": 527.85, "r_y2": 452.98, "r_x3": 393.37, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "During training, the transformer", "orig": "During training, the transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.39, "r_y0": 461.89, "r_x1": 545.12, "r_y1": 461.89, "r_x2": 545.12, "r_y2": 452.98, "r_x3": 532.39, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 473.84, "r_x1": 529.76, "r_y1": 473.84, "r_x2": 529.76, "r_y2": 464.94, "r_x3": 308.86, "r_y3": 464.94, "coord_origin": "TOPLEFT" }, "text": "coder receives as input the output feature produced by", "orig": "coder receives as input the output feature produced by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.94, "r_y0": 473.84, "r_x1": 545.12, "r_y1": 473.84, "r_x2": 545.12, "r_y2": 464.94, "r_x3": 532.94, "r_y3": 464.94, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 485.8, "r_x1": 514.17, "r_y1": 485.8, "r_x2": 514.17, "r_y2": 476.89, "r_x3": 308.86, "r_y3": 476.89, "coord_origin": "TOPLEFT" }, "text": "transformer encoder, and the tokenized input of the", "orig": "transformer encoder, and the tokenized input of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.89, "r_y0": 485.8, "r_x1": 545.12, "r_y1": 485.8, "r_x2": 545.12, "r_y2": 476.89, "r_x3": 516.89, "r_y3": 476.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.75, "r_x1": 527.63, "r_y1": 497.75, "r_x2": 527.63, "r_y2": 488.85, "r_x3": 308.86, "r_y3": 488.85, "coord_origin": "TOPLEFT" }, "text": "ground-truth tags. Using a stack of multi-head attention", "orig": "ground-truth tags. Using a stack of multi-head attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 497.75, "r_x1": 545.11, "r_y1": 497.75, "r_x2": 545.11, "r_y2": 488.85, "r_x3": 529.62, "r_y3": 488.85, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.71, "r_x1": 508.36, "r_y1": 509.71, "r_x2": 508.36, "r_y2": 500.8, "r_x3": 308.86, "r_y3": 500.8, "coord_origin": "TOPLEFT" }, "text": "ers, different aspects of the tag sequence could be", "orig": "ers, different aspects of the tag sequence could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.09, "r_y0": 509.71, "r_x1": 545.12, "r_y1": 509.71, "r_x2": 545.12, "r_y2": 500.8, "r_x3": 511.09, "r_y3": 500.8, "coord_origin": "TOPLEFT" }, "text": "inferred.", "orig": "inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.66, "r_x1": 545.11, "r_y1": 521.66, "r_x2": 545.11, "r_y2": 512.76, "r_x3": 308.86, "r_y3": 512.76, "coord_origin": "TOPLEFT" }, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.62, "r_x1": 545.12, "r_y1": 533.62, "r_x2": 545.12, "r_y2": 524.71, "r_x3": 308.86, "r_y3": 524.71, "coord_origin": "TOPLEFT" }, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.57, "r_x1": 369.73, "r_y1": 545.57, "r_x2": 369.73, "r_y2": 536.67, "r_x3": 308.86, "r_y3": 536.67, "coord_origin": "TOPLEFT" }, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 548.6, "r": 545.12, "b": 653.27, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 557.56, "r_x1": 404.76, "r_y1": 557.56, "r_x2": 404.76, "r_y2": 548.6, "r_x3": 320.82, "r_y3": 548.6, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.34, "r_y0": 557.63, "r_x1": 545.12, "r_y1": 557.63, "r_x2": 545.12, "r_y2": 548.72, "r_x3": 410.34, "r_y3": 548.72, "coord_origin": "TOPLEFT" }, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.59, "r_x1": 545.11, "r_y1": 569.59, "r_x2": 545.11, "r_y2": 560.68, "r_x3": 308.86, "r_y3": 560.68, "coord_origin": "TOPLEFT" }, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.54, "r_x1": 545.12, "r_y1": 581.54, "r_x2": 545.12, "r_y2": 572.64, "r_x3": 308.86, "r_y3": 572.64, "coord_origin": "TOPLEFT" }, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.5, "r_x1": 545.11, "r_y1": 593.5, "r_x2": 545.11, "r_y2": 584.59, "r_x3": 308.86, "r_y3": 584.59, "coord_origin": "TOPLEFT" }, "text": "to end. This approach is inspired by DETR [1] which em-", "orig": "to end. This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.45, "r_x1": 545.11, "r_y1": 605.45, "r_x2": 545.11, "r_y2": 596.55, "r_x3": 308.86, "r_y3": 596.55, "coord_origin": "TOPLEFT" }, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.41, "r_x1": 545.12, "r_y1": 617.41, "r_x2": 545.12, "r_y2": 608.5, "r_x3": 308.86, "r_y3": 608.5, "coord_origin": "TOPLEFT" }, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.36, "r_x1": 545.12, "r_y1": 629.36, "r_x2": 545.12, "r_y2": 620.46, "r_x3": 308.86, "r_y3": 620.46, "coord_origin": "TOPLEFT" }, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.32, "r_x1": 381.68, "r_y1": 641.32, "r_x2": 381.68, "r_y2": 632.41, "r_x3": 308.86, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0, "r_y0": 641.1, "r_x1": 391.75, "r_y1": 641.1, "r_x2": 391.75, "r_y2": 632.25, "r_x3": 384.0, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.75, "r_y0": 641.32, "r_x1": 399.5, "r_y1": 641.32, "r_x2": 399.5, "r_y2": 632.41, "r_x3": 391.75, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 399.5, "r_y0": 641.1, "r_x1": 407.25, "r_y1": 641.1, "r_x2": 407.25, "r_y2": 632.25, "r_x3": 399.5, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.25, "r_y0": 641.32, "r_x1": 432.91, "r_y1": 641.32, "r_x2": 432.91, "r_y2": 632.41, "r_x3": 407.25, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "\u2019 and \u2018", "orig": "\u2019 and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.91, "r_y0": 641.1, "r_x1": 440.66, "r_y1": 641.1, "r_x2": 440.66, "r_y2": 632.25, "r_x3": 432.91, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.66, "r_y0": 641.32, "r_x1": 545.11, "r_y1": 641.32, "r_x2": 545.11, "r_y2": 632.41, "r_x3": 440.66, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "\u2019 HTML structure tags be-", "orig": "\u2019 HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.27, "r_x1": 398.96, "r_y1": 653.27, "r_x2": 398.96, "r_y2": 644.37, "r_x3": 308.86, "r_y3": 644.37, "coord_origin": "TOPLEFT" }, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 656.43, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 665.33, "r_x1": 444.34, "r_y1": 665.33, "r_x2": 444.34, "r_y2": 656.43, "r_x3": 320.82, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 447.01, "r_y0": 665.1, "r_x1": 545.11, "r_y1": 665.1, "r_x2": 545.11, "r_y2": 656.51, "r_x3": 447.01, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.12, "r_y1": 677.29, "r_x2": 545.12, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "provide an attention weighted encoding. This weighted at-", "orig": "provide an attention weighted encoding. This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "picture", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "picture", "bbox": { "l": 74.31, "t": 77.91, "r": 519.98, "b": 183.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 125.63, "r_x1": 84.93, "r_y1": 125.63, "r_x2": 84.93, "r_y2": 122.44, "r_x3": 81.69, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 125.63, "r_x1": 93.03, "r_y1": 125.63, "r_x2": 93.03, "r_y2": 122.44, "r_x3": 86.55, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.5, "r_y0": 118.44, "r_x1": 115.35, "r_y1": 118.44, "r_x2": 115.35, "r_y2": 115.25, "r_x3": 102.5, "r_y3": 115.25, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.14, "r_y0": 118.4, "r_x1": 93.29, "r_y1": 118.4, "r_x2": 93.29, "r_y2": 115.21, "r_x3": 82.14, "r_y3": 115.21, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 125.63, "r_x1": 104.31, "r_y1": 125.63, "r_x2": 104.31, "r_y2": 122.44, "r_x3": 96.75, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 130.93, "r_x1": 102.42, "r_y1": 130.93, "r_x2": 102.42, "r_y2": 127.74, "r_x3": 96.75, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 136.64, "r_x1": 104.31, "r_y1": 136.64, "r_x2": 104.31, "r_y2": 133.46, "r_x3": 96.75, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 142.36, "r_x1": 102.42, "r_y1": 142.36, "r_x2": 102.42, "r_y2": 139.17, "r_x3": 96.75, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 125.63, "r_x1": 116.14, "r_y1": 125.63, "r_x2": 116.14, "r_y2": 122.44, "r_x3": 110.66, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 130.93, "r_x1": 116.14, "r_y1": 130.93, "r_x2": 116.14, "r_y2": 127.74, "r_x3": 110.66, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 136.64, "r_x1": 116.14, "r_y1": 136.64, "r_x2": 116.14, "r_y2": 133.46, "r_x3": 110.66, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 142.36, "r_x1": 116.14, "r_y1": 142.36, "r_x2": 116.14, "r_y2": 139.17, "r_x3": 110.66, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 130.93, "r_x1": 84.93, "r_y1": 130.93, "r_x2": 84.93, "r_y2": 127.74, "r_x3": 81.69, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 130.93, "r_x1": 93.03, "r_y1": 130.93, "r_x2": 93.03, "r_y2": 127.74, "r_x3": 86.55, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 136.64, "r_x1": 84.93, "r_y1": 136.64, "r_x2": 84.93, "r_y2": 133.46, "r_x3": 81.69, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 136.64, "r_x1": 93.03, "r_y1": 136.64, "r_x2": 93.03, "r_y2": 133.46, "r_x3": 86.55, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 142.36, "r_x1": 84.93, "r_y1": 142.36, "r_x2": 84.93, "r_y2": 139.17, "r_x3": 81.69, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 142.36, "r_x1": 93.03, "r_y1": 142.36, "r_x2": 93.03, "r_y2": 139.17, "r_x3": 86.55, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.08, "r_y0": 96.24, "r_x1": 113.94, "r_y1": 96.24, "r_x2": 113.94, "r_y2": 90.5, "r_x3": 88.08, "r_y3": 90.5, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81, "r_y0": 103.38, "r_x1": 119.21, "r_y1": 103.38, "r_x2": 119.21, "r_y2": 97.64, "r_x3": 82.81, "r_y3": 97.64, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94, "r_y0": 106.34, "r_x1": 180.01, "r_y1": 106.34, "r_x2": 180.01, "r_y2": 100.6, "r_x3": 143.94, "r_y3": 100.6, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94, "r_y0": 113.48, "r_x1": 172.01, "r_y1": 113.48, "r_x2": 172.01, "r_y2": 107.74, "r_x3": 151.94, "r_y3": 107.74, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.77, "r_y0": 86.67, "r_x1": 266.4, "r_y1": 86.67, "r_x2": 266.4, "r_y2": 80.93, "r_x3": 251.77, "r_y3": 80.93, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 91.77, "r_x1": 270.65, "r_y1": 91.77, "r_x2": 270.65, "r_y2": 86.03, "r_x3": 247.52, "r_y3": 86.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.04, "r_y0": 84.3, "r_x1": 352.13, "r_y1": 84.3, "r_x2": 352.13, "r_y2": 78.56, "r_x3": 331.04, "r_y3": 78.56, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56, "r_y0": 101.77, "r_x1": 431.73, "r_y1": 101.77, "r_x2": 431.73, "r_y2": 96.03, "r_x3": 390.56, "r_y3": 96.03, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82, "r_y0": 107.89, "r_x1": 435.47, "r_y1": 107.89, "r_x2": 435.47, "r_y2": 102.15, "r_x3": 386.82, "r_y3": 102.15, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 114.01, "r_x1": 433.6, "r_y1": 114.01, "r_x2": 433.6, "r_y2": 108.27, "r_x3": 388.7, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.08, "r_y0": 120.13, "r_x1": 431.23, "r_y1": 120.13, "r_x2": 431.23, "r_y2": 114.39, "r_x3": 391.08, "r_y3": 114.39, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.23, "r_y0": 157.43, "r_x1": 498.82, "r_y1": 157.43, "r_x2": 498.82, "r_y2": 151.69, "r_x3": 431.23, "r_y3": 151.69, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.17, "r_y0": 163.55, "r_x1": 498.88, "r_y1": 163.55, "r_x2": 498.88, "r_y2": 157.81, "r_x3": 431.17, "r_y3": 157.81, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.53, "r_y0": 169.67, "r_x1": 489.52, "r_y1": 169.67, "r_x2": 489.52, "r_y2": 163.93, "r_x3": 440.53, "r_y3": 163.93, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37, "r_y0": 183.99, "r_x1": 367.72, "r_y1": 183.99, "r_x2": 367.72, "r_y2": 178.25, "r_x3": 328.37, "r_y3": 178.25, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 129.65, "r_x1": 373.68, "r_y1": 129.65, "r_x2": 373.68, "r_y2": 123.91, "r_x3": 331.84, "r_y3": 123.91, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 134.75, "r_x1": 381.18, "r_y1": 134.75, "r_x2": 381.18, "r_y2": 129.01, "r_x3": 331.84, "r_y3": 129.01, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.63, "r_y0": 93.86, "r_x1": 219.42, "r_y1": 93.86, "r_x2": 219.42, "r_y2": 88.12, "r_x3": 196.63, "r_y3": 88.12, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.67, "r_y0": 135.24, "r_x1": 271.5, "r_y1": 135.24, "r_x2": 271.5, "r_y2": 129.49, "r_x3": 246.67, "r_y3": 129.49, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 140.34, "r_x1": 270.65, "r_y1": 140.34, "r_x2": 270.65, "r_y2": 134.59, "r_x3": 247.52, "r_y3": 134.59, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 94.76, "r_x1": 365.55, "r_y1": 94.76, "r_x2": 365.55, "r_y2": 89.02, "r_x3": 330.63, "r_y3": 89.02, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 102.92, "r_x1": 370.23, "r_y1": 102.92, "r_x2": 370.23, "r_y2": 97.18, "r_x3": 330.63, "r_y3": 97.18, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 111.08, "r_x1": 374.51, "r_y1": 111.08, "r_x2": 374.51, "r_y2": 105.34, "r_x3": 330.63, "r_y3": 105.34, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 119.24, "r_x1": 335.73, "r_y1": 119.24, "r_x2": 335.73, "r_y2": 113.5, "r_x3": 330.63, "r_y3": 113.5, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 146.58, "r_x1": 335.06, "r_y1": 146.58, "r_x2": 335.06, "r_y2": 141.79, "r_x3": 322.31, "r_y3": 141.79, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 153.72, "r_x1": 335.06, "r_y1": 153.72, "r_x2": 335.06, "r_y2": 148.93, "r_x3": 322.31, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.55, "r_y0": 154.3, "r_x1": 340.95, "r_y1": 154.3, "r_x2": 340.95, "r_y2": 148.56, "r_x3": 337.55, "r_y3": 148.56, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 153.72, "r_x1": 398.91, "r_y1": 153.72, "r_x2": 398.91, "r_y2": 148.93, "r_x3": 343.56, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 153.72, "r_x1": 421.59, "r_y1": 153.72, "r_x2": 421.59, "r_y2": 148.93, "r_x3": 407.42, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 160.86, "r_x1": 349.23, "r_y1": 160.86, "r_x2": 349.23, "r_y2": 156.07, "r_x3": 322.31, "r_y3": 156.07, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 168.0, "r_x1": 335.06, "r_y1": 168.0, "r_x2": 335.06, "r_y2": 163.21, "r_x3": 322.31, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 168.0, "r_x1": 374.74, "r_y1": 168.0, "r_x2": 374.74, "r_y2": 163.21, "r_x3": 343.56, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 175.14, "r_x1": 326.56, "r_y1": 175.14, "r_x2": 326.56, "r_y2": 170.35, "r_x3": 322.31, "r_y3": 170.35, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51, "r_y0": 95.41, "r_x1": 326.91, "r_y1": 95.41, "r_x2": 326.91, "r_y2": 89.67, "r_x3": 323.51, "r_y3": 89.67, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 103.53, "r_x1": 327.12, "r_y1": 103.53, "r_x2": 327.12, "r_y2": 97.79, "r_x3": 323.72, "r_y3": 97.79, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 111.73, "r_x1": 327.12, "r_y1": 111.73, "r_x2": 327.12, "r_y2": 105.99, "r_x3": 323.72, "r_y3": 105.99, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.48, "r_y0": 154.29, "r_x1": 404.88, "r_y1": 154.29, "r_x2": 404.88, "r_y2": 148.55, "r_x3": 401.48, "r_y3": 148.55, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.7, "r_y0": 168.43, "r_x1": 341.1, "r_y1": 168.43, "r_x2": 341.1, "r_y2": 162.68, "r_x3": 337.7, "r_y3": 162.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46, "r_y0": 110.29, "r_x1": 457.87, "r_y1": 110.29, "r_x2": 457.87, "r_y2": 104.55, "r_x3": 454.46, "r_y3": 104.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.33, "r_y0": 96.84, "r_x1": 496.73, "r_y1": 96.84, "r_x2": 496.73, "r_y2": 91.1, "r_x3": 493.33, "r_y3": 91.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08, "r_y0": 96.31, "r_x1": 457.49, "r_y1": 96.31, "r_x2": 457.49, "r_y2": 90.57, "r_x3": 454.08, "r_y3": 90.57, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 81.69, "t": 122.44, "r": 84.93, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 125.63, "r_x1": 84.93, "r_y1": 125.63, "r_x2": 84.93, "r_y2": 122.44, "r_x3": 81.69, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 86.55, "t": 122.44, "r": 93.03, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 125.63, "r_x1": 93.03, "r_y1": 125.63, "r_x2": 93.03, "r_y2": 122.44, "r_x3": 86.55, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 102.5, "t": 115.25, "r": 115.35, "b": 118.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.5, "r_y0": 118.44, "r_x1": 115.35, "r_y1": 118.44, "r_x2": 115.35, "r_y2": 115.25, "r_x3": 102.5, "r_y3": 115.25, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 82.14, "t": 115.21, "r": 93.29, "b": 118.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.14, "r_y0": 118.4, "r_x1": 93.29, "r_y1": 118.4, "r_x2": 93.29, "r_y2": 115.21, "r_x3": 82.14, "r_y3": 115.21, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 96.75, "t": 122.44, "r": 104.31, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 125.63, "r_x1": 104.31, "r_y1": 125.63, "r_x2": 104.31, "r_y2": 122.44, "r_x3": 96.75, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 96.75, "t": 127.74, "r": 102.42, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 130.93, "r_x1": 102.42, "r_y1": 130.93, "r_x2": 102.42, "r_y2": 127.74, "r_x3": 96.75, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 96.75, "t": 133.46, "r": 104.31, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 136.64, "r_x1": 104.31, "r_y1": 136.64, "r_x2": 104.31, "r_y2": 133.46, "r_x3": 96.75, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 96.75, "t": 139.17, "r": 102.42, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 142.36, "r_x1": 102.42, "r_y1": 142.36, "r_x2": 102.42, "r_y2": 139.17, "r_x3": 96.75, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 110.66, "t": 122.44, "r": 116.14, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 125.63, "r_x1": 116.14, "r_y1": 125.63, "r_x2": 116.14, "r_y2": 122.44, "r_x3": 110.66, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 110.66, "t": 127.74, "r": 116.14, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 130.93, "r_x1": 116.14, "r_y1": 130.93, "r_x2": 116.14, "r_y2": 127.74, "r_x3": 110.66, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 110.66, "t": 133.46, "r": 116.14, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 136.64, "r_x1": 116.14, "r_y1": 136.64, "r_x2": 116.14, "r_y2": 133.46, "r_x3": 110.66, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 110.66, "t": 139.17, "r": 116.14, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 142.36, "r_x1": 116.14, "r_y1": 142.36, "r_x2": 116.14, "r_y2": 139.17, "r_x3": 110.66, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 81.69, "t": 127.74, "r": 84.93, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 130.93, "r_x1": 84.93, "r_y1": 130.93, "r_x2": 84.93, "r_y2": 127.74, "r_x3": 81.69, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 86.55, "t": 127.74, "r": 93.03, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 130.93, "r_x1": 93.03, "r_y1": 130.93, "r_x2": 93.03, "r_y2": 127.74, "r_x3": 86.55, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 81.69, "t": 133.46, "r": 84.93, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 136.64, "r_x1": 84.93, "r_y1": 136.64, "r_x2": 84.93, "r_y2": 133.46, "r_x3": 81.69, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 86.55, "t": 133.46, "r": 93.03, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 136.64, "r_x1": 93.03, "r_y1": 136.64, "r_x2": 93.03, "r_y2": 133.46, "r_x3": 86.55, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 81.69, "t": 139.17, "r": 84.93, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 142.36, "r_x1": 84.93, "r_y1": 142.36, "r_x2": 84.93, "r_y2": 139.17, "r_x3": 81.69, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 86.55, "t": 139.17, "r": 93.03, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 142.36, "r_x1": 93.03, "r_y1": 142.36, "r_x2": 93.03, "r_y2": 139.17, "r_x3": 86.55, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 88.08, "t": 90.5, "r": 113.94, "b": 96.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.08, "r_y0": 96.24, "r_x1": 113.94, "r_y1": 96.24, "r_x2": 113.94, "r_y2": 90.5, "r_x3": 88.08, "r_y3": 90.5, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 82.81, "t": 97.64, "r": 119.21, "b": 103.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81, "r_y0": 103.38, "r_x1": 119.21, "r_y1": 103.38, "r_x2": 119.21, "r_y2": 97.64, "r_x3": 82.81, "r_y3": 97.64, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 143.94, "t": 100.6, "r": 180.01, "b": 106.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94, "r_y0": 106.34, "r_x1": 180.01, "r_y1": 106.34, "r_x2": 180.01, "r_y2": 100.6, "r_x3": 143.94, "r_y3": 100.6, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 151.94, "t": 107.74, "r": 172.01, "b": 113.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94, "r_y0": 113.48, "r_x1": 172.01, "r_y1": 113.48, "r_x2": 172.01, "r_y2": 107.74, "r_x3": 151.94, "r_y3": 107.74, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 251.77, "t": 80.93, "r": 266.4, "b": 86.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.77, "r_y0": 86.67, "r_x1": 266.4, "r_y1": 86.67, "r_x2": 266.4, "r_y2": 80.93, "r_x3": 251.77, "r_y3": 80.93, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 247.52, "t": 86.03, "r": 270.65, "b": 91.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 91.77, "r_x1": 270.65, "r_y1": 91.77, "r_x2": 270.65, "r_y2": 86.03, "r_x3": 247.52, "r_y3": 86.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 331.04, "t": 78.56, "r": 352.13, "b": 84.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.04, "r_y0": 84.3, "r_x1": 352.13, "r_y1": 84.3, "r_x2": 352.13, "r_y2": 78.56, "r_x3": 331.04, "r_y3": 78.56, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 390.56, "t": 96.03, "r": 431.73, "b": 101.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56, "r_y0": 101.77, "r_x1": 431.73, "r_y1": 101.77, "r_x2": 431.73, "r_y2": 96.03, "r_x3": 390.56, "r_y3": 96.03, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 386.82, "t": 102.15, "r": 435.47, "b": 107.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82, "r_y0": 107.89, "r_x1": 435.47, "r_y1": 107.89, "r_x2": 435.47, "r_y2": 102.15, "r_x3": 386.82, "r_y3": 102.15, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 388.7, "t": 108.27, "r": 433.6, "b": 114.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 114.01, "r_x1": 433.6, "r_y1": 114.01, "r_x2": 433.6, "r_y2": 108.27, "r_x3": 388.7, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 391.08, "t": 114.39, "r": 431.23, "b": 120.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.08, "r_y0": 120.13, "r_x1": 431.23, "r_y1": 120.13, "r_x2": 431.23, "r_y2": 114.39, "r_x3": 391.08, "r_y3": 114.39, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 431.23, "t": 151.69, "r": 498.82, "b": 157.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.23, "r_y0": 157.43, "r_x1": 498.82, "r_y1": 157.43, "r_x2": 498.82, "r_y2": 151.69, "r_x3": 431.23, "r_y3": 151.69, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 431.17, "t": 157.81, "r": 498.88, "b": 163.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.17, "r_y0": 163.55, "r_x1": 498.88, "r_y1": 163.55, "r_x2": 498.88, "r_y2": 157.81, "r_x3": 431.17, "r_y3": 157.81, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 440.53, "t": 163.93, "r": 489.52, "b": 169.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.53, "r_y0": 169.67, "r_x1": 489.52, "r_y1": 169.67, "r_x2": 489.52, "r_y2": 163.93, "r_x3": 440.53, "r_y3": 163.93, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 328.37, "t": 178.25, "r": 367.72, "b": 183.99, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37, "r_y0": 183.99, "r_x1": 367.72, "r_y1": 183.99, "r_x2": 367.72, "r_y2": 178.25, "r_x3": 328.37, "r_y3": 178.25, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 331.84, "t": 123.91, "r": 373.68, "b": 129.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 129.65, "r_x1": 373.68, "r_y1": 129.65, "r_x2": 373.68, "r_y2": 123.91, "r_x3": 331.84, "r_y3": 123.91, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 331.84, "t": 129.01, "r": 381.18, "b": 134.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 134.75, "r_x1": 381.18, "r_y1": 134.75, "r_x2": 381.18, "r_y2": 129.01, "r_x3": 331.84, "r_y3": 129.01, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 196.63, "t": 88.12, "r": 219.42, "b": 93.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.63, "r_y0": 93.86, "r_x1": 219.42, "r_y1": 93.86, "r_x2": 219.42, "r_y2": 88.12, "r_x3": 196.63, "r_y3": 88.12, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 246.67, "t": 129.49, "r": 271.5, "b": 135.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.67, "r_y0": 135.24, "r_x1": 271.5, "r_y1": 135.24, "r_x2": 271.5, "r_y2": 129.49, "r_x3": 246.67, "r_y3": 129.49, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 247.52, "t": 134.59, "r": 270.65, "b": 140.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 140.34, "r_x1": 270.65, "r_y1": 140.34, "r_x2": 270.65, "r_y2": 134.59, "r_x3": 247.52, "r_y3": 134.59, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 330.63, "t": 89.02, "r": 365.55, "b": 94.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 94.76, "r_x1": 365.55, "r_y1": 94.76, "r_x2": 365.55, "r_y2": 89.02, "r_x3": 330.63, "r_y3": 89.02, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 330.63, "t": 97.18, "r": 370.23, "b": 102.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 102.92, "r_x1": 370.23, "r_y1": 102.92, "r_x2": 370.23, "r_y2": 97.18, "r_x3": 330.63, "r_y3": 97.18, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 330.63, "t": 105.34, "r": 374.51, "b": 111.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 111.08, "r_x1": 374.51, "r_y1": 111.08, "r_x2": 374.51, "r_y2": 105.34, "r_x3": 330.63, "r_y3": 105.34, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 330.63, "t": 113.5, "r": 335.73, "b": 119.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 119.24, "r_x1": 335.73, "r_y1": 119.24, "r_x2": 335.73, "r_y2": 113.5, "r_x3": 330.63, "r_y3": 113.5, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 322.31, "t": 141.79, "r": 335.06, "b": 146.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 146.58, "r_x1": 335.06, "r_y1": 146.58, "r_x2": 335.06, "r_y2": 141.79, "r_x3": 322.31, "r_y3": 141.79, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 322.31, "t": 148.93, "r": 335.06, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 153.72, "r_x1": 335.06, "r_y1": 153.72, "r_x2": 335.06, "r_y2": 148.93, "r_x3": 322.31, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 337.55, "t": 148.56, "r": 340.95, "b": 154.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.55, "r_y0": 154.3, "r_x1": 340.95, "r_y1": 154.3, "r_x2": 340.95, "r_y2": 148.56, "r_x3": 337.55, "r_y3": 148.56, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 343.56, "t": 148.93, "r": 398.91, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 153.72, "r_x1": 398.91, "r_y1": 153.72, "r_x2": 398.91, "r_y2": 148.93, "r_x3": 343.56, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 407.42, "t": 148.93, "r": 421.59, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 153.72, "r_x1": 421.59, "r_y1": 153.72, "r_x2": 421.59, "r_y2": 148.93, "r_x3": 407.42, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 322.31, "t": 156.07, "r": 349.23, "b": 160.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 160.86, "r_x1": 349.23, "r_y1": 160.86, "r_x2": 349.23, "r_y2": 156.07, "r_x3": 322.31, "r_y3": 156.07, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 322.31, "t": 163.21, "r": 335.06, "b": 168.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 168.0, "r_x1": 335.06, "r_y1": 168.0, "r_x2": 335.06, "r_y2": 163.21, "r_x3": 322.31, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 343.56, "t": 163.21, "r": 374.74, "b": 168.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 168.0, "r_x1": 374.74, "r_y1": 168.0, "r_x2": 374.74, "r_y2": 163.21, "r_x3": 343.56, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 322.31, "t": 170.35, "r": 326.56, "b": 175.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 175.14, "r_x1": 326.56, "r_y1": 175.14, "r_x2": 326.56, "r_y2": 170.35, "r_x3": 322.31, "r_y3": 170.35, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 323.51, "t": 89.67, "r": 326.91, "b": 95.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51, "r_y0": 95.41, "r_x1": 326.91, "r_y1": 95.41, "r_x2": 326.91, "r_y2": 89.67, "r_x3": 323.51, "r_y3": 89.67, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 323.72, "t": 97.79, "r": 327.12, "b": 103.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 103.53, "r_x1": 327.12, "r_y1": 103.53, "r_x2": 327.12, "r_y2": 97.79, "r_x3": 323.72, "r_y3": 97.79, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 323.72, "t": 105.99, "r": 327.12, "b": 111.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 111.73, "r_x1": 327.12, "r_y1": 111.73, "r_x2": 327.12, "r_y2": 105.99, "r_x3": 323.72, "r_y3": 105.99, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 401.48, "t": 148.55, "r": 404.88, "b": 154.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.48, "r_y0": 154.29, "r_x1": 404.88, "r_y1": 154.29, "r_x2": 404.88, "r_y2": 148.55, "r_x3": 401.48, "r_y3": 148.55, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 337.7, "t": 162.68, "r": 341.1, "b": 168.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.7, "r_y0": 168.43, "r_x1": 341.1, "r_y1": 168.43, "r_x2": 341.1, "r_y2": 162.68, "r_x3": 337.7, "r_y3": 162.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 454.46, "t": 104.55, "r": 457.87, "b": 110.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46, "r_y0": 110.29, "r_x1": 457.87, "r_y1": 110.29, "r_x2": 457.87, "r_y2": 104.55, "r_x3": 454.46, "r_y3": 104.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 493.33, "t": 91.1, "r": 496.73, "b": 96.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.33, "r_y0": 96.84, "r_x1": 496.73, "r_y1": 96.84, "r_x2": 496.73, "r_y2": 91.1, "r_x3": 493.33, "r_y3": 91.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 454.08, "t": 90.57, "r": 457.49, "b": 96.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08, "r_y0": 96.31, "r_x1": 457.49, "r_y1": 96.31, "r_x2": 457.49, "r_y2": 90.57, "r_x3": 454.08, "r_y3": 90.57, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 50.11, "t": 203.99, "r": 545.11, "b": 224.97, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 213.01, "r_x1": 86.88, "r_y1": 213.01, "r_x2": 86.88, "r_y2": 204.11, "r_x3": 50.11, "r_y3": 204.11, "coord_origin": "TOPLEFT" }, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.02, "r_y0": 212.94, "r_x1": 149.85, "r_y1": 212.94, "r_x2": 149.85, "r_y2": 203.99, "r_x3": 94.02, "r_y3": 203.99, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.86, "r_y0": 213.01, "r_x1": 545.11, "r_y1": 213.01, "r_x2": 545.11, "r_y2": 204.11, "r_x3": 152.86, "r_y3": 204.11, "coord_origin": "TOPLEFT" }, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 224.97, "r_x1": 436.01, "r_y1": 224.97, "r_x2": 436.01, "r_y2": 216.06, "r_x3": 50.11, "r_y3": 216.06, "coord_origin": "TOPLEFT" }, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 3: TableFormer takes in an image of the PDF and creates bounding box and HTML structure predictions that are synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure." }, { "label": "picture", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "picture", "bbox": { "l": 53.03, "t": 257.67, "r": 285.37, "b": 507.67, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.25, "r_y0": 264.17, "r_x1": 101.76, "r_y1": 264.17, "r_x2": 101.76, "r_y2": 258.21, "r_x3": 74.25, "r_y3": 258.21, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.3, "r_y0": 264.31, "r_x1": 157.84, "r_y1": 264.31, "r_x2": 157.84, "r_y2": 258.35, "r_x3": 122.3, "r_y3": 258.35, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.55, "r_y0": 377.05, "r_x1": 125.68, "r_y1": 377.05, "r_x2": 125.68, "r_y2": 371.39, "r_x3": 78.55, "r_y3": 371.39, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.51, "r_y0": 396.98, "r_x1": 84.64, "r_y1": 396.98, "r_x2": 84.64, "r_y2": 391.32, "r_x3": 78.51, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.53, "r_y0": 396.98, "r_x1": 125.11, "r_y1": 396.98, "r_x2": 125.11, "r_y2": 391.32, "r_x3": 116.53, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.02, "r_y0": 430.12, "r_x1": 127.92, "r_y1": 430.12, "r_x2": 127.92, "r_y2": 424.45, "r_x3": 76.02, "r_y3": 424.45, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.38, "r_y0": 450.55, "r_x1": 84.51, "r_y1": 450.55, "r_x2": 84.51, "r_y2": 444.89, "r_x3": 78.38, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.4, "r_y0": 450.55, "r_x1": 124.98, "r_y1": 450.55, "r_x2": 124.98, "r_y2": 444.89, "r_x3": 116.4, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.47, "r_y0": 468.11, "r_x1": 181.63, "r_y1": 468.11, "r_x2": 181.63, "r_y2": 462.44, "r_x3": 167.47, "r_y3": 462.44, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61, "r_y0": 484.13, "r_x1": 184.43, "r_y1": 484.13, "r_x2": 184.43, "r_y2": 478.47, "r_x3": 165.61, "r_y3": 478.47, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.32, "r_y0": 330.22, "r_x1": 132.92, "r_y1": 330.22, "r_x2": 132.92, "r_y2": 324.26, "r_x3": 65.32, "r_y3": 324.26, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51, "r_y0": 274.73, "r_x1": 162.99, "r_y1": 274.73, "r_x2": 162.99, "r_y2": 269.66, "r_x3": 119.51, "r_y3": 269.66, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.73, "r_y0": 279.98, "r_x1": 151.41, "r_y1": 279.98, "r_x2": 151.41, "r_y2": 274.91, "r_x3": 128.73, "r_y3": 274.91, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.43, "r_y0": 344.27, "r_x1": 80.27, "r_y1": 344.27, "r_x2": 80.27, "r_y2": 338.96, "r_x3": 60.43, "r_y3": 338.96, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.6, "r_y0": 348.7, "r_x1": 78.85, "r_y1": 348.7, "r_x2": 78.85, "r_y2": 343.39, "r_x3": 60.6, "r_y3": 343.39, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.83, "r_y0": 298.69, "r_x1": 154.66, "r_y1": 298.69, "r_x2": 154.66, "r_y2": 293.38, "r_x3": 134.83, "r_y3": 293.38, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99, "r_y0": 303.11, "r_x1": 153.25, "r_y1": 303.11, "r_x2": 153.25, "r_y2": 297.8, "r_x3": 134.99, "r_y3": 297.8, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 351.02, "r_x1": 197.15, "r_y1": 351.02, "r_x2": 197.15, "r_y2": 345.36, "r_x3": 150.55, "r_y3": 345.36, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 400.09, "r_x1": 156.68, "r_y1": 400.09, "r_x2": 156.68, "r_y2": 394.42, "r_x3": 150.55, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 400.09, "r_x1": 197.15, "r_y1": 400.09, "r_x2": 197.15, "r_y2": 394.42, "r_x3": 188.57, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.19, "r_y0": 381.33, "r_x1": 197.32, "r_y1": 381.33, "r_x2": 197.32, "r_y2": 375.67, "r_x3": 150.19, "r_y3": 375.67, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 445.91, "r_x1": 156.68, "r_y1": 445.91, "r_x2": 156.68, "r_y2": 440.25, "r_x3": 150.55, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 445.91, "r_x1": 197.15, "r_y1": 445.91, "r_x2": 197.15, "r_y2": 440.25, "r_x3": 188.57, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86, "r_y0": 427.76, "r_x1": 199.76, "r_y1": 427.76, "r_x2": 199.76, "r_y2": 422.09, "r_x3": 147.86, "r_y3": 422.09, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.57, "r_y0": 319.92, "r_x1": 255.73, "r_y1": 319.92, "r_x2": 255.73, "r_y2": 314.26, "r_x3": 241.57, "r_y3": 314.26, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.92, "r_y0": 367.03, "r_x1": 256.08, "r_y1": 367.03, "r_x2": 256.08, "r_y2": 361.36, "r_x3": 241.92, "r_y3": 361.36, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.05, "r_y0": 342.28, "r_x1": 248.72, "r_y1": 342.28, "r_x2": 248.72, "r_y2": 336.62, "r_x3": 228.05, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 342.28, "r_x1": 269.39, "r_y1": 342.28, "r_x2": 269.39, "r_y2": 336.62, "r_x3": 246.29, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.45, "r_y0": 410.81, "r_x1": 238.74, "r_y1": 410.81, "r_x2": 238.74, "r_y2": 405.15, "r_x3": 228.45, "r_y3": 405.15, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.3, "r_y0": 410.87, "r_x1": 271.78, "r_y1": 410.87, "r_x2": 271.78, "r_y2": 405.2, "r_x3": 256.3, "r_y3": 405.2, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.55, "r_y0": 387.88, "r_x1": 258.09, "r_y1": 387.88, "r_x2": 258.09, "r_y2": 382.21, "r_x3": 239.55, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.15, "r_y0": 449.78, "r_x1": 59.51, "r_y1": 449.78, "r_x2": 59.51, "r_y2": 384.87, "r_x3": 54.15, "r_y3": 384.87, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.24, "r_y0": 378.45, "r_x1": 59.3, "r_y1": 378.45, "r_x2": 59.3, "r_y2": 373.81, "r_x3": 54.24, "r_y3": 373.81, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.3, "r_y0": 490.37, "r_x1": 122.16, "r_y1": 490.37, "r_x2": 122.16, "r_y2": 484.53, "r_x3": 85.3, "r_y3": 484.53, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.67, "r_y0": 285.46, "r_x1": 265.32, "r_y1": 285.46, "r_x2": 265.32, "r_y2": 279.55, "r_x3": 229.67, "r_y3": 279.55, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17, "r_y0": 506.13, "r_x1": 190.42, "r_y1": 506.13, "r_x2": 190.42, "r_y2": 500.3, "r_x3": 157.17, "r_y3": 500.3, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.82, "r_y0": 443.89, "r_x1": 270.78, "r_y1": 443.89, "r_x2": 270.78, "r_y2": 438.06, "r_x3": 227.82, "r_y3": 438.06, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.7, "r_y0": 449.89, "r_x1": 263.51, "r_y1": 449.89, "r_x2": 263.51, "r_y2": 444.06, "r_x3": 233.7, "r_y3": 444.06, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.75, "r_y0": 298.76, "r_x1": 212.16, "r_y1": 298.76, "r_x2": 212.16, "r_y2": 293.4, "r_x3": 184.75, "r_y3": 293.4, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91, "r_y0": 304.51, "r_x1": 216.74, "r_y1": 304.51, "r_x2": 216.74, "r_y2": 299.15, "r_x3": 178.91, "r_y3": 299.15, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.25, "r_y0": 287.85, "r_x1": 198.89, "r_y1": 287.85, "r_x2": 198.89, "r_y2": 282.78, "r_x3": 194.25, "r_y3": 282.78, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 277.83, "r_x1": 276.47, "r_y1": 277.83, "r_x2": 276.47, "r_y2": 271.87, "r_x3": 221.46, "r_y3": 271.87, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65, "r_y0": 329.1, "r_x1": 197.29, "r_y1": 329.1, "r_x2": 197.29, "r_y2": 323.44, "r_x3": 151.65, "r_y3": 323.44, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43, "r_y0": 335.1, "r_x1": 184.19, "r_y1": 335.1, "r_x2": 184.19, "r_y2": 329.44, "r_x3": 163.43, "r_y3": 329.44, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 70, "label": "text", "bbox": { "l": 74.25, "t": 258.21, "r": 101.76, "b": 264.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.25, "r_y0": 264.17, "r_x1": 101.76, "r_y1": 264.17, "r_x2": 101.76, "r_y2": 258.21, "r_x3": 74.25, "r_y3": 258.21, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 122.3, "t": 258.35, "r": 157.84, "b": 264.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.3, "r_y0": 264.31, "r_x1": 157.84, "r_y1": 264.31, "r_x2": 157.84, "r_y2": 258.35, "r_x3": 122.3, "r_y3": 258.35, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 78.55, "t": 371.39, "r": 125.68, "b": 377.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.55, "r_y0": 377.05, "r_x1": 125.68, "r_y1": 377.05, "r_x2": 125.68, "r_y2": 371.39, "r_x3": 78.55, "r_y3": 371.39, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 78.51, "t": 391.32, "r": 84.64, "b": 396.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.51, "r_y0": 396.98, "r_x1": 84.64, "r_y1": 396.98, "r_x2": 84.64, "r_y2": 391.32, "r_x3": 78.51, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 116.53, "t": 391.32, "r": 125.11, "b": 396.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.53, "r_y0": 396.98, "r_x1": 125.11, "r_y1": 396.98, "r_x2": 125.11, "r_y2": 391.32, "r_x3": 116.53, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 76.02, "t": 424.45, "r": 127.92, "b": 430.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.02, "r_y0": 430.12, "r_x1": 127.92, "r_y1": 430.12, "r_x2": 127.92, "r_y2": 424.45, "r_x3": 76.02, "r_y3": 424.45, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 78.38, "t": 444.89, "r": 84.51, "b": 450.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.38, "r_y0": 450.55, "r_x1": 84.51, "r_y1": 450.55, "r_x2": 84.51, "r_y2": 444.89, "r_x3": 78.38, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 116.4, "t": 444.89, "r": 124.98, "b": 450.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.4, "r_y0": 450.55, "r_x1": 124.98, "r_y1": 450.55, "r_x2": 124.98, "r_y2": 444.89, "r_x3": 116.4, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 167.47, "t": 462.44, "r": 181.63, "b": 468.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.47, "r_y0": 468.11, "r_x1": 181.63, "r_y1": 468.11, "r_x2": 181.63, "r_y2": 462.44, "r_x3": 167.47, "r_y3": 462.44, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 165.61, "t": 478.47, "r": 184.43, "b": 484.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61, "r_y0": 484.13, "r_x1": 184.43, "r_y1": 484.13, "r_x2": 184.43, "r_y2": 478.47, "r_x3": 165.61, "r_y3": 478.47, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 65.32, "t": 324.26, "r": 132.92, "b": 330.22, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.32, "r_y0": 330.22, "r_x1": 132.92, "r_y1": 330.22, "r_x2": 132.92, "r_y2": 324.26, "r_x3": 65.32, "r_y3": 324.26, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 119.51, "t": 269.66, "r": 162.99, "b": 274.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51, "r_y0": 274.73, "r_x1": 162.99, "r_y1": 274.73, "r_x2": 162.99, "r_y2": 269.66, "r_x3": 119.51, "r_y3": 269.66, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 128.73, "t": 274.91, "r": 151.41, "b": 279.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.73, "r_y0": 279.98, "r_x1": 151.41, "r_y1": 279.98, "r_x2": 151.41, "r_y2": 274.91, "r_x3": 128.73, "r_y3": 274.91, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 60.43, "t": 338.96, "r": 80.27, "b": 344.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.43, "r_y0": 344.27, "r_x1": 80.27, "r_y1": 344.27, "r_x2": 80.27, "r_y2": 338.96, "r_x3": 60.43, "r_y3": 338.96, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 60.6, "t": 343.39, "r": 78.85, "b": 348.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.6, "r_y0": 348.7, "r_x1": 78.85, "r_y1": 348.7, "r_x2": 78.85, "r_y2": 343.39, "r_x3": 60.6, "r_y3": 343.39, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 134.83, "t": 293.38, "r": 154.66, "b": 298.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.83, "r_y0": 298.69, "r_x1": 154.66, "r_y1": 298.69, "r_x2": 154.66, "r_y2": 293.38, "r_x3": 134.83, "r_y3": 293.38, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 134.99, "t": 297.8, "r": 153.25, "b": 303.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99, "r_y0": 303.11, "r_x1": 153.25, "r_y1": 303.11, "r_x2": 153.25, "r_y2": 297.8, "r_x3": 134.99, "r_y3": 297.8, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 150.55, "t": 345.36, "r": 197.15, "b": 351.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 351.02, "r_x1": 197.15, "r_y1": 351.02, "r_x2": 197.15, "r_y2": 345.36, "r_x3": 150.55, "r_y3": 345.36, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 150.55, "t": 394.42, "r": 156.68, "b": 400.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 400.09, "r_x1": 156.68, "r_y1": 400.09, "r_x2": 156.68, "r_y2": 394.42, "r_x3": 150.55, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 188.57, "t": 394.42, "r": 197.15, "b": 400.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 400.09, "r_x1": 197.15, "r_y1": 400.09, "r_x2": 197.15, "r_y2": 394.42, "r_x3": 188.57, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 150.19, "t": 375.67, "r": 197.32, "b": 381.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.19, "r_y0": 381.33, "r_x1": 197.32, "r_y1": 381.33, "r_x2": 197.32, "r_y2": 375.67, "r_x3": 150.19, "r_y3": 375.67, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 150.55, "t": 440.25, "r": 156.68, "b": 445.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 445.91, "r_x1": 156.68, "r_y1": 445.91, "r_x2": 156.68, "r_y2": 440.25, "r_x3": 150.55, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 188.57, "t": 440.25, "r": 197.15, "b": 445.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 445.91, "r_x1": 197.15, "r_y1": 445.91, "r_x2": 197.15, "r_y2": 440.25, "r_x3": 188.57, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 147.86, "t": 422.09, "r": 199.76, "b": 427.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86, "r_y0": 427.76, "r_x1": 199.76, "r_y1": 427.76, "r_x2": 199.76, "r_y2": 422.09, "r_x3": 147.86, "r_y3": 422.09, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 241.57, "t": 314.26, "r": 255.73, "b": 319.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.57, "r_y0": 319.92, "r_x1": 255.73, "r_y1": 319.92, "r_x2": 255.73, "r_y2": 314.26, "r_x3": 241.57, "r_y3": 314.26, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 241.92, "t": 361.36, "r": 256.08, "b": 367.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.92, "r_y0": 367.03, "r_x1": 256.08, "r_y1": 367.03, "r_x2": 256.08, "r_y2": 361.36, "r_x3": 241.92, "r_y3": 361.36, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 228.05, "t": 336.62, "r": 248.72, "b": 342.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.05, "r_y0": 342.28, "r_x1": 248.72, "r_y1": 342.28, "r_x2": 248.72, "r_y2": 336.62, "r_x3": 228.05, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 246.29, "t": 336.62, "r": 269.39, "b": 342.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 342.28, "r_x1": 269.39, "r_y1": 342.28, "r_x2": 269.39, "r_y2": 336.62, "r_x3": 246.29, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 228.45, "t": 405.15, "r": 238.74, "b": 410.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.45, "r_y0": 410.81, "r_x1": 238.74, "r_y1": 410.81, "r_x2": 238.74, "r_y2": 405.15, "r_x3": 228.45, "r_y3": 405.15, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 256.3, "t": 405.2, "r": 271.78, "b": 410.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.3, "r_y0": 410.87, "r_x1": 271.78, "r_y1": 410.87, "r_x2": 271.78, "r_y2": 405.2, "r_x3": 256.3, "r_y3": 405.2, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 239.55, "t": 382.21, "r": 258.09, "b": 387.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.55, "r_y0": 387.88, "r_x1": 258.09, "r_y1": 387.88, "r_x2": 258.09, "r_y2": 382.21, "r_x3": 239.55, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 54.15, "t": 384.87, "r": 59.51, "b": 449.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.15, "r_y0": 449.78, "r_x1": 59.51, "r_y1": 449.78, "r_x2": 59.51, "r_y2": 384.87, "r_x3": 54.15, "r_y3": 384.87, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 54.24, "t": 373.81, "r": 59.3, "b": 378.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.24, "r_y0": 378.45, "r_x1": 59.3, "r_y1": 378.45, "r_x2": 59.3, "r_y2": 373.81, "r_x3": 54.24, "r_y3": 373.81, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 85.3, "t": 484.53, "r": 122.16, "b": 490.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.3, "r_y0": 490.37, "r_x1": 122.16, "r_y1": 490.37, "r_x2": 122.16, "r_y2": 484.53, "r_x3": 85.3, "r_y3": 484.53, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 229.67, "t": 279.55, "r": 265.32, "b": 285.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.67, "r_y0": 285.46, "r_x1": 265.32, "r_y1": 285.46, "r_x2": 265.32, "r_y2": 279.55, "r_x3": 229.67, "r_y3": 279.55, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 157.17, "t": 500.3, "r": 190.42, "b": 506.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17, "r_y0": 506.13, "r_x1": 190.42, "r_y1": 506.13, "r_x2": 190.42, "r_y2": 500.3, "r_x3": 157.17, "r_y3": 500.3, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 227.82, "t": 438.06, "r": 270.78, "b": 443.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.82, "r_y0": 443.89, "r_x1": 270.78, "r_y1": 443.89, "r_x2": 270.78, "r_y2": 438.06, "r_x3": 227.82, "r_y3": 438.06, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 233.7, "t": 444.06, "r": 263.51, "b": 449.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.7, "r_y0": 449.89, "r_x1": 263.51, "r_y1": 449.89, "r_x2": 263.51, "r_y2": 444.06, "r_x3": 233.7, "r_y3": 444.06, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 184.75, "t": 293.4, "r": 212.16, "b": 298.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.75, "r_y0": 298.76, "r_x1": 212.16, "r_y1": 298.76, "r_x2": 212.16, "r_y2": 293.4, "r_x3": 184.75, "r_y3": 293.4, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 178.91, "t": 299.15, "r": 216.74, "b": 304.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91, "r_y0": 304.51, "r_x1": 216.74, "r_y1": 304.51, "r_x2": 216.74, "r_y2": 299.15, "r_x3": 178.91, "r_y3": 299.15, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 194.25, "t": 282.78, "r": 198.89, "b": 287.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.25, "r_y0": 287.85, "r_x1": 198.89, "r_y1": 287.85, "r_x2": 198.89, "r_y2": 282.78, "r_x3": 194.25, "r_y3": 282.78, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 221.46, "t": 271.87, "r": 276.47, "b": 277.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 277.83, "r_x1": 276.47, "r_y1": 277.83, "r_x2": 276.47, "r_y2": 271.87, "r_x3": 221.46, "r_y3": 271.87, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 151.65, "t": 323.44, "r": 197.29, "b": 329.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65, "r_y0": 329.1, "r_x1": 197.29, "r_y1": 329.1, "r_x2": 197.29, "r_y2": 323.44, "r_x3": 151.65, "r_y3": 323.44, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 163.43, "t": 329.44, "r": 184.19, "b": 335.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43, "r_y0": 335.1, "r_x1": 184.19, "r_y1": 335.1, "r_x2": 184.19, "r_y2": 329.44, "r_x3": 163.43, "r_y3": 329.44, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 8, "page_no": 4, "cluster": { "id": 8, "label": "caption", "bbox": { "l": 50.11, "t": 527.78, "r": 286.37, "b": 680.27, "coord_origin": "TOPLEFT" }, "confidence": 0.891, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 536.81, "r_x1": 229.79, "r_y1": 536.81, "r_x2": 229.79, "r_y2": 527.9, "r_x3": 50.11, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "Figure 4: Given an input image of a table, the", "orig": "Figure 4: Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.79, "r_y0": 536.74, "r_x1": 267.76, "r_y1": 536.74, "r_x2": 267.76, "r_y2": 527.78, "r_x3": 231.79, "r_y3": 527.78, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.76, "r_y0": 536.81, "r_x1": 286.36, "r_y1": 536.81, "r_x2": 286.36, "r_y2": 527.9, "r_x3": 269.76, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 548.76, "r_x1": 286.37, "r_y1": 548.76, "r_x2": 286.37, "r_y2": 539.86, "r_x3": 50.11, "r_y3": 539.86, "coord_origin": "TOPLEFT" }, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 560.72, "r_x1": 205.85, "r_y1": 560.72, "r_x2": 205.85, "r_y2": 551.81, "r_x3": 50.11, "r_y3": 551.81, "coord_origin": "TOPLEFT" }, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.02, "r_y0": 560.65, "r_x1": 286.36, "r_y1": 560.65, "r_x2": 286.36, "r_y2": 551.69, "r_x3": 208.02, "r_y3": 551.69, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 572.67, "r_x1": 64.5, "r_y1": 572.67, "r_x2": 64.5, "r_y2": 563.77, "r_x3": 50.11, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.17, "r_y0": 572.61, "r_x1": 151.31, "r_y1": 572.61, "r_x2": 151.31, "r_y2": 563.65, "r_x3": 68.17, "r_y3": 563.65, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.31, "r_y0": 572.67, "r_x1": 153.8, "r_y1": 572.67, "r_x2": 153.8, "r_y2": 563.77, "r_x3": 151.31, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.42, "r_y0": 572.67, "r_x1": 241.93, "r_y1": 572.67, "r_x2": 241.93, "r_y2": 563.77, "r_x3": 160.42, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.6, "r_y0": 572.61, "r_x1": 286.36, "r_y1": 572.61, "r_x2": 286.36, "r_y2": 563.65, "r_x3": 245.6, "r_y3": 563.65, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 584.56, "r_x1": 85.52, "r_y1": 584.56, "r_x2": 85.52, "r_y2": 575.6, "r_x3": 50.11, "r_y3": 575.6, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.62, "r_y0": 584.63, "r_x1": 286.36, "r_y1": 584.63, "r_x2": 286.36, "r_y2": 575.72, "r_x3": 88.62, "r_y3": 575.72, "coord_origin": "TOPLEFT" }, "text": "receives \u2018tokenized tags\u2019 of the HTML code that", "orig": "receives \u2018tokenized tags\u2019 of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 596.58, "r_x1": 286.37, "r_y1": 596.58, "r_x2": 286.37, "r_y2": 587.68, "r_x3": 50.11, "r_y3": 587.68, "coord_origin": "TOPLEFT" }, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 608.54, "r_x1": 286.37, "r_y1": 608.54, "r_x2": 286.37, "r_y2": 599.63, "r_x3": 50.11, "r_y3": 599.63, "coord_origin": "TOPLEFT" }, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 620.49, "r_x1": 240.44, "r_y1": 620.49, "r_x2": 240.44, "r_y2": 611.59, "r_x3": 50.11, "r_y3": 611.59, "coord_origin": "TOPLEFT" }, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.2, "r_y0": 620.43, "r_x1": 286.37, "r_y1": 620.43, "r_x2": 286.37, "r_y2": 611.47, "r_x3": 243.2, "r_y3": 611.47, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 632.38, "r_x1": 286.37, "r_y1": 632.38, "r_x2": 286.37, "r_y2": 623.42, "r_x3": 50.11, "r_y3": 623.42, "coord_origin": "TOPLEFT" }, "text": "Decoder. The linear layer is applied to the features to", "orig": "Decoder. The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 644.34, "r_x1": 286.37, "r_y1": 644.34, "r_x2": 286.37, "r_y2": 635.38, "r_x3": 50.11, "r_y3": 635.38, "coord_origin": "TOPLEFT" }, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 656.36, "r_x1": 220.58, "r_y1": 656.36, "r_x2": 220.58, "r_y2": 647.45, "r_x3": 50.11, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "selects features referring to the data cells (\u2018", "orig": "selects features referring to the data cells (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.58, "r_y0": 656.14, "r_x1": 228.33, "r_y1": 656.14, "r_x2": 228.33, "r_y2": 647.29, "r_x3": 220.58, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.33, "r_y0": 656.36, "r_x1": 236.08, "r_y1": 656.36, "r_x2": 236.08, "r_y2": 647.45, "r_x3": 228.33, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.08, "r_y0": 656.14, "r_x1": 243.83, "r_y1": 656.14, "r_x2": 243.83, "r_y2": 647.29, "r_x3": 236.08, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.83, "r_y0": 656.36, "r_x1": 255.29, "r_y1": 656.36, "r_x2": 255.29, "r_y2": 647.45, "r_x3": 243.83, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018", "orig": "\u2019, \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.29, "r_y0": 656.14, "r_x1": 263.04, "r_y1": 656.14, "r_x2": 263.04, "r_y2": 647.29, "r_x3": 255.29, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.04, "r_y0": 656.36, "r_x1": 286.36, "r_y1": 656.36, "r_x2": 286.36, "r_y2": 647.45, "r_x3": 263.04, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "\u2019) and", "orig": "\u2019) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 668.32, "r_x1": 286.37, "r_y1": 668.32, "r_x2": 286.37, "r_y2": 659.41, "r_x3": 50.11, "r_y3": 659.41, "coord_origin": "TOPLEFT" }, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 680.27, "r_x1": 218.47, "r_y1": 680.27, "r_x2": 218.47, "r_y2": 671.36, "r_x3": 50.11, "r_y3": 671.36, "coord_origin": "TOPLEFT" }, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 4: Given an input image of a table, the Encoder produces fixed-length features that represent the input image. The features are then passed to both the Structure Decoder and Cell BBox Decoder . During training, the Structure Decoder receives 'tokenized tags' of the HTML code that represent the table structure. Afterwards, a transformer encoder and decoder architecture is employed to produce features that are received by a linear layer, and the Cell BBox Decoder. The linear layer is applied to the features to predict the tags. Simultaneously, the Cell BBox Decoder selects features referring to the data cells (' < td > ', ' < ') and passes them through an attention network, an MLP, and a linear layer to predict the bounding boxes." }, { "label": "text", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 249.53, "r": 545.12, "b": 294.31, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.44, "r_x1": 523.06, "r_y1": 258.44, "r_x2": 523.06, "r_y2": 249.53, "r_x3": 308.86, "r_y3": 249.53, "coord_origin": "TOPLEFT" }, "text": "forming classification, and adding an adaptive pooling", "orig": "forming classification, and adding an adaptive pooling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.2, "r_y0": 258.44, "r_x1": 545.12, "r_y1": 258.44, "r_x2": 545.12, "r_y2": 249.53, "r_x3": 525.2, "r_y3": 249.53, "coord_origin": "TOPLEFT" }, "text": "layer", "orig": "layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.4, "r_x1": 517.56, "r_y1": 270.4, "r_x2": 517.56, "r_y2": 261.49, "r_x3": 308.86, "r_y3": 261.49, "coord_origin": "TOPLEFT" }, "text": "of size 28*28. ResNet by default downsamples the", "orig": "of size 28*28. ResNet by default downsamples the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 270.4, "r_x1": 545.11, "r_y1": 270.4, "r_x2": 545.11, "r_y2": 261.49, "r_x3": 520.77, "r_y3": 261.49, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.35, "r_x1": 534.8, "r_y1": 282.35, "r_x2": 534.8, "r_y2": 273.45, "r_x3": 308.86, "r_y3": 273.45, "coord_origin": "TOPLEFT" }, "text": "resolution by 32 and then the encoded image is provided", "orig": "resolution by 32 and then the encoded image is provided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.36, "r_y0": 282.35, "r_x1": 545.12, "r_y1": 282.35, "r_x2": 545.12, "r_y2": 273.45, "r_x3": 537.36, "r_y3": 273.45, "coord_origin": "TOPLEFT" }, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.31, "r_x1": 341.24, "r_y1": 294.31, "r_x2": 341.24, "r_y2": 285.4, "r_x3": 308.86, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.73, "r_y0": 294.08, "r_x1": 417.24, "r_y1": 294.08, "r_x2": 417.24, "r_y2": 285.49, "r_x3": 343.73, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.23, "r_y0": 294.31, "r_x1": 436.6, "r_y1": 294.31, "r_x2": 436.6, "r_y2": 285.4, "r_x3": 417.23, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.09, "r_y0": 294.08, "r_x1": 516.56, "r_y1": 294.08, "r_x2": 516.56, "r_y2": 285.49, "r_x3": 439.09, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.56, "r_y0": 294.31, "r_x1": 519.05, "r_y1": 294.31, "r_x2": 519.05, "r_y2": 285.4, "r_x3": 516.56, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "forming classification, and adding an adaptive pooling layer of size 28*28. ResNet by default downsamples the image resolution by 32 and then the encoded image is provided to both the Structure Decoder , and Cell BBox Decoder ." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 297.34, "r": 545.12, "b": 413.96, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 306.3, "r_x1": 400.87, "r_y1": 306.3, "r_x2": 400.87, "r_y2": 297.34, "r_x3": 320.82, "r_y3": 297.34, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.91, "r_y0": 306.37, "r_x1": 528.34, "r_y1": 306.37, "r_x2": 528.34, "r_y2": 297.46, "r_x3": 403.91, "r_y3": 297.46, "coord_origin": "TOPLEFT" }, "text": "The transformer architecture of", "orig": "The transformer architecture of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.72, "r_y0": 306.37, "r_x1": 545.11, "r_y1": 306.37, "r_x2": 545.11, "r_y2": 297.46, "r_x3": 530.72, "r_y3": 297.46, "coord_origin": "TOPLEFT" }, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 318.32, "r_x1": 517.53, "r_y1": 318.32, "r_x2": 517.53, "r_y2": 309.41, "r_x3": 308.86, "r_y3": 309.41, "coord_origin": "TOPLEFT" }, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.09, "r_y0": 318.32, "r_x1": 545.11, "r_y1": 318.32, "r_x2": 545.11, "r_y2": 309.41, "r_x3": 524.09, "r_y3": 309.41, "coord_origin": "TOPLEFT" }, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 330.28, "r_x1": 432.36, "r_y1": 330.28, "r_x2": 432.36, "r_y2": 321.37, "r_x3": 308.86, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.82, "r_y0": 330.05, "r_x1": 510.29, "r_y1": 330.05, "r_x2": 510.29, "r_y2": 321.46, "r_x3": 435.82, "r_y3": 321.46, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.98, "r_y0": 330.28, "r_x1": 520.62, "r_y1": 330.28, "r_x2": 520.62, "r_y2": 321.37, "r_x3": 513.98, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.08, "r_y0": 330.28, "r_x1": 545.11, "r_y1": 330.28, "r_x2": 545.11, "r_y2": 321.37, "r_x3": 524.08, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 342.23, "r_x1": 527.76, "r_y1": 342.23, "r_x2": 527.76, "r_y2": 333.32, "r_x3": 308.86, "r_y3": 333.32, "coord_origin": "TOPLEFT" }, "text": "eled as a transformer encoder with two encoder layers", "orig": "eled as a transformer encoder with two encoder layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.73, "r_y0": 342.23, "r_x1": 545.11, "r_y1": 342.23, "r_x2": 545.11, "r_y2": 333.32, "r_x3": 530.73, "r_y3": 333.32, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 354.19, "r_x1": 526.85, "r_y1": 354.19, "r_x2": 526.85, "r_y2": 345.28, "r_x3": 308.86, "r_y3": 345.28, "coord_origin": "TOPLEFT" }, "text": "a transformer decoder made from a stack of 4 decoder", "orig": "a transformer decoder made from a stack of 4 decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 354.19, "r_x1": 545.11, "r_y1": 354.19, "r_x2": 545.11, "r_y2": 345.28, "r_x3": 529.62, "r_y3": 345.28, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 366.14, "r_x1": 524.51, "r_y1": 366.14, "r_x2": 524.51, "r_y2": 357.24, "r_x3": 308.86, "r_y3": 357.24, "coord_origin": "TOPLEFT" }, "text": "ers that comprise mainly of multi-head attention and", "orig": "ers that comprise mainly of multi-head attention and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.97, "r_y0": 366.14, "r_x1": 545.12, "r_y1": 366.14, "r_x2": 545.12, "r_y2": 357.24, "r_x3": 527.97, "r_y3": 357.24, "coord_origin": "TOPLEFT" }, "text": "feed", "orig": "feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 378.1, "r_x1": 370.39, "r_y1": 378.1, "r_x2": 370.39, "r_y2": 369.19, "r_x3": 308.86, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.44, "r_y0": 378.1, "r_x1": 526.91, "r_y1": 378.1, "r_x2": 526.91, "r_y2": 369.19, "r_x3": 377.44, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "This configuration uses fewer layers", "orig": "This configuration uses fewer layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.73, "r_y0": 378.1, "r_x1": 545.12, "r_y1": 378.1, "r_x2": 545.12, "r_y2": 369.19, "r_x3": 530.73, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 390.05, "r_x1": 505.46, "r_y1": 390.05, "r_x2": 505.46, "r_y2": 381.15, "r_x3": 308.86, "r_y3": 381.15, "coord_origin": "TOPLEFT" }, "text": "heads in comparison to networks applied to other", "orig": "heads in comparison to networks applied to other", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.03, "r_y0": 390.05, "r_x1": 545.12, "r_y1": 390.05, "r_x2": 545.12, "r_y2": 381.15, "r_x3": 508.03, "r_y3": 381.15, "coord_origin": "TOPLEFT" }, "text": "problems", "orig": "problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 402.01, "r_x1": 517.69, "r_y1": 402.01, "r_x2": 517.69, "r_y2": 393.1, "r_x3": 308.86, "r_y3": 393.1, "coord_origin": "TOPLEFT" }, "text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 402.01, "r_x1": 545.11, "r_y1": 402.01, "r_x2": 545.11, "r_y2": 393.1, "r_x3": 520.77, "r_y3": 393.1, "coord_origin": "TOPLEFT" }, "text": "some-", "orig": "some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 413.96, "r_x1": 528.02, "r_y1": 413.96, "r_x2": 528.02, "r_y2": 405.06, "r_x3": 308.86, "r_y3": 405.06, "coord_origin": "TOPLEFT" }, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Structure Decoder. The transformer architecture of this component is based on the work proposed in [31]. After extensive experimentation, the Structure Decoder is modeled as a transformer encoder with two encoder layers and a transformer decoder made from a stack of 4 decoder layers that comprise mainly of multi-head attention and feed forward layers. This configuration uses fewer layers and heads in comparison to networks applied to other problems (e.g. \"Scene Understanding\", \"Image Captioning\"), something which we relate to the simplicity of table images." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 417.11, "r": 545.12, "b": 545.57, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 426.02, "r_x1": 515.5, "r_y1": 426.02, "r_x2": 515.5, "r_y2": 417.11, "r_x3": 320.82, "r_y3": 417.11, "coord_origin": "TOPLEFT" }, "text": "The transformer encoder receives an encoded", "orig": "The transformer encoder receives an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 426.02, "r_x1": 545.11, "r_y1": 426.02, "r_x2": 545.11, "r_y2": 417.11, "r_x3": 520.77, "r_y3": 417.11, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 437.98, "r_x1": 343.72, "r_y1": 437.98, "r_x2": 343.72, "r_y2": 429.07, "r_x3": 308.86, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.04, "r_y0": 437.75, "r_x1": 446.45, "r_y1": 437.75, "r_x2": 446.45, "r_y2": 429.16, "r_x3": 347.04, "r_y3": 429.16, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.94, "r_y0": 437.98, "r_x1": 503.06, "r_y1": 437.98, "r_x2": 503.06, "r_y2": 429.07, "r_x3": 449.94, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "and refines it", "orig": "and refines it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 506.38, "r_y0": 437.98, "r_x1": 537.37, "r_y1": 437.98, "r_x2": 537.37, "r_y2": 429.07, "r_x3": 506.38, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "through", "orig": "through", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 540.69, "r_y0": 437.98, "r_x1": 545.11, "r_y1": 437.98, "r_x2": 545.11, "r_y2": 429.07, "r_x3": 540.69, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 449.93, "r_x1": 522.79, "r_y1": 449.93, "r_x2": 522.79, "r_y2": 441.02, "r_x3": 308.86, "r_y3": 441.02, "coord_origin": "TOPLEFT" }, "text": "multi-head dot-product attention layer, followed by a", "orig": "multi-head dot-product attention layer, followed by a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.75, "r_y0": 449.93, "r_x1": 545.12, "r_y1": 449.93, "r_x2": 545.12, "r_y2": 441.02, "r_x3": 525.75, "r_y3": 441.02, "coord_origin": "TOPLEFT" }, "text": "Feed", "orig": "Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 461.89, "r_x1": 384.15, "r_y1": 461.89, "r_x2": 384.15, "r_y2": 452.98, "r_x3": 308.86, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.37, "r_y0": 461.89, "r_x1": 527.85, "r_y1": 461.89, "r_x2": 527.85, "r_y2": 452.98, "r_x3": 393.37, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "During training, the transformer", "orig": "During training, the transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.39, "r_y0": 461.89, "r_x1": 545.12, "r_y1": 461.89, "r_x2": 545.12, "r_y2": 452.98, "r_x3": 532.39, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 473.84, "r_x1": 529.76, "r_y1": 473.84, "r_x2": 529.76, "r_y2": 464.94, "r_x3": 308.86, "r_y3": 464.94, "coord_origin": "TOPLEFT" }, "text": "coder receives as input the output feature produced by", "orig": "coder receives as input the output feature produced by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.94, "r_y0": 473.84, "r_x1": 545.12, "r_y1": 473.84, "r_x2": 545.12, "r_y2": 464.94, "r_x3": 532.94, "r_y3": 464.94, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 485.8, "r_x1": 514.17, "r_y1": 485.8, "r_x2": 514.17, "r_y2": 476.89, "r_x3": 308.86, "r_y3": 476.89, "coord_origin": "TOPLEFT" }, "text": "transformer encoder, and the tokenized input of the", "orig": "transformer encoder, and the tokenized input of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.89, "r_y0": 485.8, "r_x1": 545.12, "r_y1": 485.8, "r_x2": 545.12, "r_y2": 476.89, "r_x3": 516.89, "r_y3": 476.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.75, "r_x1": 527.63, "r_y1": 497.75, "r_x2": 527.63, "r_y2": 488.85, "r_x3": 308.86, "r_y3": 488.85, "coord_origin": "TOPLEFT" }, "text": "ground-truth tags. Using a stack of multi-head attention", "orig": "ground-truth tags. Using a stack of multi-head attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 497.75, "r_x1": 545.11, "r_y1": 497.75, "r_x2": 545.11, "r_y2": 488.85, "r_x3": 529.62, "r_y3": 488.85, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.71, "r_x1": 508.36, "r_y1": 509.71, "r_x2": 508.36, "r_y2": 500.8, "r_x3": 308.86, "r_y3": 500.8, "coord_origin": "TOPLEFT" }, "text": "ers, different aspects of the tag sequence could be", "orig": "ers, different aspects of the tag sequence could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.09, "r_y0": 509.71, "r_x1": 545.12, "r_y1": 509.71, "r_x2": 545.12, "r_y2": 500.8, "r_x3": 511.09, "r_y3": 500.8, "coord_origin": "TOPLEFT" }, "text": "inferred.", "orig": "inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.66, "r_x1": 545.11, "r_y1": 521.66, "r_x2": 545.11, "r_y2": 512.76, "r_x3": 308.86, "r_y3": 512.76, "coord_origin": "TOPLEFT" }, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.62, "r_x1": 545.12, "r_y1": 533.62, "r_x2": 545.12, "r_y2": 524.71, "r_x3": 308.86, "r_y3": 524.71, "coord_origin": "TOPLEFT" }, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.57, "r_x1": 369.73, "r_y1": 545.57, "r_x2": 369.73, "r_y2": 536.67, "r_x3": 308.86, "r_y3": 536.67, "coord_origin": "TOPLEFT" }, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The transformer encoder receives an encoded image from the CNN Backbone Network and refines it through a multi-head dot-product attention layer, followed by a Feed Forward Network. During training, the transformer decoder receives as input the output feature produced by the transformer encoder, and the tokenized input of the HTML ground-truth tags. Using a stack of multi-head attention layers, different aspects of the tag sequence could be inferred. This is achieved by each attention head on a layer operating in a different subspace, and then combining altogether their attention score." }, { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 548.6, "r": 545.12, "b": 653.27, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 557.56, "r_x1": 404.76, "r_y1": 557.56, "r_x2": 404.76, "r_y2": 548.6, "r_x3": 320.82, "r_y3": 548.6, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.34, "r_y0": 557.63, "r_x1": 545.12, "r_y1": 557.63, "r_x2": 545.12, "r_y2": 548.72, "r_x3": 410.34, "r_y3": 548.72, "coord_origin": "TOPLEFT" }, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.59, "r_x1": 545.11, "r_y1": 569.59, "r_x2": 545.11, "r_y2": 560.68, "r_x3": 308.86, "r_y3": 560.68, "coord_origin": "TOPLEFT" }, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.54, "r_x1": 545.12, "r_y1": 581.54, "r_x2": 545.12, "r_y2": 572.64, "r_x3": 308.86, "r_y3": 572.64, "coord_origin": "TOPLEFT" }, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.5, "r_x1": 545.11, "r_y1": 593.5, "r_x2": 545.11, "r_y2": 584.59, "r_x3": 308.86, "r_y3": 584.59, "coord_origin": "TOPLEFT" }, "text": "to end. This approach is inspired by DETR [1] which em-", "orig": "to end. This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.45, "r_x1": 545.11, "r_y1": 605.45, "r_x2": 545.11, "r_y2": 596.55, "r_x3": 308.86, "r_y3": 596.55, "coord_origin": "TOPLEFT" }, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.41, "r_x1": 545.12, "r_y1": 617.41, "r_x2": 545.12, "r_y2": 608.5, "r_x3": 308.86, "r_y3": 608.5, "coord_origin": "TOPLEFT" }, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.36, "r_x1": 545.12, "r_y1": 629.36, "r_x2": 545.12, "r_y2": 620.46, "r_x3": 308.86, "r_y3": 620.46, "coord_origin": "TOPLEFT" }, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.32, "r_x1": 381.68, "r_y1": 641.32, "r_x2": 381.68, "r_y2": 632.41, "r_x3": 308.86, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0, "r_y0": 641.1, "r_x1": 391.75, "r_y1": 641.1, "r_x2": 391.75, "r_y2": 632.25, "r_x3": 384.0, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.75, "r_y0": 641.32, "r_x1": 399.5, "r_y1": 641.32, "r_x2": 399.5, "r_y2": 632.41, "r_x3": 391.75, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 399.5, "r_y0": 641.1, "r_x1": 407.25, "r_y1": 641.1, "r_x2": 407.25, "r_y2": 632.25, "r_x3": 399.5, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.25, "r_y0": 641.32, "r_x1": 432.91, "r_y1": 641.32, "r_x2": 432.91, "r_y2": 632.41, "r_x3": 407.25, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "\u2019 and \u2018", "orig": "\u2019 and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.91, "r_y0": 641.1, "r_x1": 440.66, "r_y1": 641.1, "r_x2": 440.66, "r_y2": 632.25, "r_x3": 432.91, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.66, "r_y0": 641.32, "r_x1": 545.11, "r_y1": 641.32, "r_x2": 545.11, "r_y2": 632.41, "r_x3": 440.66, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "\u2019 HTML structure tags be-", "orig": "\u2019 HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.27, "r_x1": 398.96, "r_y1": 653.27, "r_x2": 398.96, "r_y2": 644.37, "r_x3": 308.86, "r_y3": 644.37, "coord_origin": "TOPLEFT" }, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell BBox Decoder. Our architecture allows to simultaneously predict HTML tags and bounding boxes for each table cell without the need of a separate object detector end to end. This approach is inspired by DETR [1] which employs a Transformer Encoder, and Decoder that looks for a specific number of object queries (potential object detections). As our model utilizes a transformer architecture, the hidden state of the < td > ' and ' < ' HTML structure tags become the object query." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 656.43, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 665.33, "r_x1": 444.34, "r_y1": 665.33, "r_x2": 444.34, "r_y2": 656.43, "r_x3": 320.82, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 447.01, "r_y0": 665.1, "r_x1": 545.11, "r_y1": 665.1, "r_x2": 545.11, "r_y2": 656.51, "r_x3": 447.01, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.12, "r_y1": 677.29, "r_x2": 545.12, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "provide an attention weighted encoding. This weighted at-", "orig": "provide an attention weighted encoding. This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The encoding generated by the CNN Backbone Network along with the features acquired for every data cell from the Transformer Decoder are then passed to the attention network. The attention network takes both inputs and learns to provide an attention weighted encoding. This weighted at-" }, { "label": "page_footer", "id": 9, "page_no": 4, "cluster": { "id": 9, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" } ], "body": [ { "label": "picture", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "picture", "bbox": { "l": 74.31, "t": 77.91, "r": 519.98, "b": 183.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 125.63, "r_x1": 84.93, "r_y1": 125.63, "r_x2": 84.93, "r_y2": 122.44, "r_x3": 81.69, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 125.63, "r_x1": 93.03, "r_y1": 125.63, "r_x2": 93.03, "r_y2": 122.44, "r_x3": 86.55, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.5, "r_y0": 118.44, "r_x1": 115.35, "r_y1": 118.44, "r_x2": 115.35, "r_y2": 115.25, "r_x3": 102.5, "r_y3": 115.25, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.14, "r_y0": 118.4, "r_x1": 93.29, "r_y1": 118.4, "r_x2": 93.29, "r_y2": 115.21, "r_x3": 82.14, "r_y3": 115.21, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 125.63, "r_x1": 104.31, "r_y1": 125.63, "r_x2": 104.31, "r_y2": 122.44, "r_x3": 96.75, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 130.93, "r_x1": 102.42, "r_y1": 130.93, "r_x2": 102.42, "r_y2": 127.74, "r_x3": 96.75, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 136.64, "r_x1": 104.31, "r_y1": 136.64, "r_x2": 104.31, "r_y2": 133.46, "r_x3": 96.75, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 142.36, "r_x1": 102.42, "r_y1": 142.36, "r_x2": 102.42, "r_y2": 139.17, "r_x3": 96.75, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 125.63, "r_x1": 116.14, "r_y1": 125.63, "r_x2": 116.14, "r_y2": 122.44, "r_x3": 110.66, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 130.93, "r_x1": 116.14, "r_y1": 130.93, "r_x2": 116.14, "r_y2": 127.74, "r_x3": 110.66, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 136.64, "r_x1": 116.14, "r_y1": 136.64, "r_x2": 116.14, "r_y2": 133.46, "r_x3": 110.66, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 142.36, "r_x1": 116.14, "r_y1": 142.36, "r_x2": 116.14, "r_y2": 139.17, "r_x3": 110.66, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 130.93, "r_x1": 84.93, "r_y1": 130.93, "r_x2": 84.93, "r_y2": 127.74, "r_x3": 81.69, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 130.93, "r_x1": 93.03, "r_y1": 130.93, "r_x2": 93.03, "r_y2": 127.74, "r_x3": 86.55, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 136.64, "r_x1": 84.93, "r_y1": 136.64, "r_x2": 84.93, "r_y2": 133.46, "r_x3": 81.69, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 136.64, "r_x1": 93.03, "r_y1": 136.64, "r_x2": 93.03, "r_y2": 133.46, "r_x3": 86.55, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 142.36, "r_x1": 84.93, "r_y1": 142.36, "r_x2": 84.93, "r_y2": 139.17, "r_x3": 81.69, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 142.36, "r_x1": 93.03, "r_y1": 142.36, "r_x2": 93.03, "r_y2": 139.17, "r_x3": 86.55, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.08, "r_y0": 96.24, "r_x1": 113.94, "r_y1": 96.24, "r_x2": 113.94, "r_y2": 90.5, "r_x3": 88.08, "r_y3": 90.5, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81, "r_y0": 103.38, "r_x1": 119.21, "r_y1": 103.38, "r_x2": 119.21, "r_y2": 97.64, "r_x3": 82.81, "r_y3": 97.64, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94, "r_y0": 106.34, "r_x1": 180.01, "r_y1": 106.34, "r_x2": 180.01, "r_y2": 100.6, "r_x3": 143.94, "r_y3": 100.6, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94, "r_y0": 113.48, "r_x1": 172.01, "r_y1": 113.48, "r_x2": 172.01, "r_y2": 107.74, "r_x3": 151.94, "r_y3": 107.74, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.77, "r_y0": 86.67, "r_x1": 266.4, "r_y1": 86.67, "r_x2": 266.4, "r_y2": 80.93, "r_x3": 251.77, "r_y3": 80.93, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 91.77, "r_x1": 270.65, "r_y1": 91.77, "r_x2": 270.65, "r_y2": 86.03, "r_x3": 247.52, "r_y3": 86.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.04, "r_y0": 84.3, "r_x1": 352.13, "r_y1": 84.3, "r_x2": 352.13, "r_y2": 78.56, "r_x3": 331.04, "r_y3": 78.56, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56, "r_y0": 101.77, "r_x1": 431.73, "r_y1": 101.77, "r_x2": 431.73, "r_y2": 96.03, "r_x3": 390.56, "r_y3": 96.03, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82, "r_y0": 107.89, "r_x1": 435.47, "r_y1": 107.89, "r_x2": 435.47, "r_y2": 102.15, "r_x3": 386.82, "r_y3": 102.15, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 114.01, "r_x1": 433.6, "r_y1": 114.01, "r_x2": 433.6, "r_y2": 108.27, "r_x3": 388.7, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.08, "r_y0": 120.13, "r_x1": 431.23, "r_y1": 120.13, "r_x2": 431.23, "r_y2": 114.39, "r_x3": 391.08, "r_y3": 114.39, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.23, "r_y0": 157.43, "r_x1": 498.82, "r_y1": 157.43, "r_x2": 498.82, "r_y2": 151.69, "r_x3": 431.23, "r_y3": 151.69, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.17, "r_y0": 163.55, "r_x1": 498.88, "r_y1": 163.55, "r_x2": 498.88, "r_y2": 157.81, "r_x3": 431.17, "r_y3": 157.81, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.53, "r_y0": 169.67, "r_x1": 489.52, "r_y1": 169.67, "r_x2": 489.52, "r_y2": 163.93, "r_x3": 440.53, "r_y3": 163.93, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37, "r_y0": 183.99, "r_x1": 367.72, "r_y1": 183.99, "r_x2": 367.72, "r_y2": 178.25, "r_x3": 328.37, "r_y3": 178.25, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 129.65, "r_x1": 373.68, "r_y1": 129.65, "r_x2": 373.68, "r_y2": 123.91, "r_x3": 331.84, "r_y3": 123.91, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 134.75, "r_x1": 381.18, "r_y1": 134.75, "r_x2": 381.18, "r_y2": 129.01, "r_x3": 331.84, "r_y3": 129.01, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.63, "r_y0": 93.86, "r_x1": 219.42, "r_y1": 93.86, "r_x2": 219.42, "r_y2": 88.12, "r_x3": 196.63, "r_y3": 88.12, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.67, "r_y0": 135.24, "r_x1": 271.5, "r_y1": 135.24, "r_x2": 271.5, "r_y2": 129.49, "r_x3": 246.67, "r_y3": 129.49, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 140.34, "r_x1": 270.65, "r_y1": 140.34, "r_x2": 270.65, "r_y2": 134.59, "r_x3": 247.52, "r_y3": 134.59, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 94.76, "r_x1": 365.55, "r_y1": 94.76, "r_x2": 365.55, "r_y2": 89.02, "r_x3": 330.63, "r_y3": 89.02, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 102.92, "r_x1": 370.23, "r_y1": 102.92, "r_x2": 370.23, "r_y2": 97.18, "r_x3": 330.63, "r_y3": 97.18, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 111.08, "r_x1": 374.51, "r_y1": 111.08, "r_x2": 374.51, "r_y2": 105.34, "r_x3": 330.63, "r_y3": 105.34, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 119.24, "r_x1": 335.73, "r_y1": 119.24, "r_x2": 335.73, "r_y2": 113.5, "r_x3": 330.63, "r_y3": 113.5, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 146.58, "r_x1": 335.06, "r_y1": 146.58, "r_x2": 335.06, "r_y2": 141.79, "r_x3": 322.31, "r_y3": 141.79, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 153.72, "r_x1": 335.06, "r_y1": 153.72, "r_x2": 335.06, "r_y2": 148.93, "r_x3": 322.31, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.55, "r_y0": 154.3, "r_x1": 340.95, "r_y1": 154.3, "r_x2": 340.95, "r_y2": 148.56, "r_x3": 337.55, "r_y3": 148.56, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 153.72, "r_x1": 398.91, "r_y1": 153.72, "r_x2": 398.91, "r_y2": 148.93, "r_x3": 343.56, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 153.72, "r_x1": 421.59, "r_y1": 153.72, "r_x2": 421.59, "r_y2": 148.93, "r_x3": 407.42, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 160.86, "r_x1": 349.23, "r_y1": 160.86, "r_x2": 349.23, "r_y2": 156.07, "r_x3": 322.31, "r_y3": 156.07, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 168.0, "r_x1": 335.06, "r_y1": 168.0, "r_x2": 335.06, "r_y2": 163.21, "r_x3": 322.31, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 168.0, "r_x1": 374.74, "r_y1": 168.0, "r_x2": 374.74, "r_y2": 163.21, "r_x3": 343.56, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 175.14, "r_x1": 326.56, "r_y1": 175.14, "r_x2": 326.56, "r_y2": 170.35, "r_x3": 322.31, "r_y3": 170.35, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51, "r_y0": 95.41, "r_x1": 326.91, "r_y1": 95.41, "r_x2": 326.91, "r_y2": 89.67, "r_x3": 323.51, "r_y3": 89.67, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 103.53, "r_x1": 327.12, "r_y1": 103.53, "r_x2": 327.12, "r_y2": 97.79, "r_x3": 323.72, "r_y3": 97.79, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 111.73, "r_x1": 327.12, "r_y1": 111.73, "r_x2": 327.12, "r_y2": 105.99, "r_x3": 323.72, "r_y3": 105.99, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.48, "r_y0": 154.29, "r_x1": 404.88, "r_y1": 154.29, "r_x2": 404.88, "r_y2": 148.55, "r_x3": 401.48, "r_y3": 148.55, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.7, "r_y0": 168.43, "r_x1": 341.1, "r_y1": 168.43, "r_x2": 341.1, "r_y2": 162.68, "r_x3": 337.7, "r_y3": 162.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46, "r_y0": 110.29, "r_x1": 457.87, "r_y1": 110.29, "r_x2": 457.87, "r_y2": 104.55, "r_x3": 454.46, "r_y3": 104.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.33, "r_y0": 96.84, "r_x1": 496.73, "r_y1": 96.84, "r_x2": 496.73, "r_y2": 91.1, "r_x3": 493.33, "r_y3": 91.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08, "r_y0": 96.31, "r_x1": 457.49, "r_y1": 96.31, "r_x2": 457.49, "r_y2": 90.57, "r_x3": 454.08, "r_y3": 90.57, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 81.69, "t": 122.44, "r": 84.93, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 125.63, "r_x1": 84.93, "r_y1": 125.63, "r_x2": 84.93, "r_y2": 122.44, "r_x3": 81.69, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 86.55, "t": 122.44, "r": 93.03, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 125.63, "r_x1": 93.03, "r_y1": 125.63, "r_x2": 93.03, "r_y2": 122.44, "r_x3": 86.55, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 102.5, "t": 115.25, "r": 115.35, "b": 118.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.5, "r_y0": 118.44, "r_x1": 115.35, "r_y1": 118.44, "r_x2": 115.35, "r_y2": 115.25, "r_x3": 102.5, "r_y3": 115.25, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 82.14, "t": 115.21, "r": 93.29, "b": 118.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.14, "r_y0": 118.4, "r_x1": 93.29, "r_y1": 118.4, "r_x2": 93.29, "r_y2": 115.21, "r_x3": 82.14, "r_y3": 115.21, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 96.75, "t": 122.44, "r": 104.31, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 125.63, "r_x1": 104.31, "r_y1": 125.63, "r_x2": 104.31, "r_y2": 122.44, "r_x3": 96.75, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 96.75, "t": 127.74, "r": 102.42, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 130.93, "r_x1": 102.42, "r_y1": 130.93, "r_x2": 102.42, "r_y2": 127.74, "r_x3": 96.75, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 96.75, "t": 133.46, "r": 104.31, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 136.64, "r_x1": 104.31, "r_y1": 136.64, "r_x2": 104.31, "r_y2": 133.46, "r_x3": 96.75, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 96.75, "t": 139.17, "r": 102.42, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 96.75, "r_y0": 142.36, "r_x1": 102.42, "r_y1": 142.36, "r_x2": 102.42, "r_y2": 139.17, "r_x3": 96.75, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 110.66, "t": 122.44, "r": 116.14, "b": 125.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 125.63, "r_x1": 116.14, "r_y1": 125.63, "r_x2": 116.14, "r_y2": 122.44, "r_x3": 110.66, "r_y3": 122.44, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 110.66, "t": 127.74, "r": 116.14, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 130.93, "r_x1": 116.14, "r_y1": 130.93, "r_x2": 116.14, "r_y2": 127.74, "r_x3": 110.66, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 110.66, "t": 133.46, "r": 116.14, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 136.64, "r_x1": 116.14, "r_y1": 136.64, "r_x2": 116.14, "r_y2": 133.46, "r_x3": 110.66, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 110.66, "t": 139.17, "r": 116.14, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.66, "r_y0": 142.36, "r_x1": 116.14, "r_y1": 142.36, "r_x2": 116.14, "r_y2": 139.17, "r_x3": 110.66, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 81.69, "t": 127.74, "r": 84.93, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 130.93, "r_x1": 84.93, "r_y1": 130.93, "r_x2": 84.93, "r_y2": 127.74, "r_x3": 81.69, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 86.55, "t": 127.74, "r": 93.03, "b": 130.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 130.93, "r_x1": 93.03, "r_y1": 130.93, "r_x2": 93.03, "r_y2": 127.74, "r_x3": 86.55, "r_y3": 127.74, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 81.69, "t": 133.46, "r": 84.93, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 136.64, "r_x1": 84.93, "r_y1": 136.64, "r_x2": 84.93, "r_y2": 133.46, "r_x3": 81.69, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 86.55, "t": 133.46, "r": 93.03, "b": 136.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 136.64, "r_x1": 93.03, "r_y1": 136.64, "r_x2": 93.03, "r_y2": 133.46, "r_x3": 86.55, "r_y3": 133.46, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 81.69, "t": 139.17, "r": 84.93, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.69, "r_y0": 142.36, "r_x1": 84.93, "r_y1": 142.36, "r_x2": 84.93, "r_y2": 139.17, "r_x3": 81.69, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 86.55, "t": 139.17, "r": 93.03, "b": 142.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.55, "r_y0": 142.36, "r_x1": 93.03, "r_y1": 142.36, "r_x2": 93.03, "r_y2": 139.17, "r_x3": 86.55, "r_y3": 139.17, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 88.08, "t": 90.5, "r": 113.94, "b": 96.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.08, "r_y0": 96.24, "r_x1": 113.94, "r_y1": 96.24, "r_x2": 113.94, "r_y2": 90.5, "r_x3": 88.08, "r_y3": 90.5, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 82.81, "t": 97.64, "r": 119.21, "b": 103.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.81, "r_y0": 103.38, "r_x1": 119.21, "r_y1": 103.38, "r_x2": 119.21, "r_y2": 97.64, "r_x3": 82.81, "r_y3": 97.64, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 143.94, "t": 100.6, "r": 180.01, "b": 106.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.94, "r_y0": 106.34, "r_x1": 180.01, "r_y1": 106.34, "r_x2": 180.01, "r_y2": 100.6, "r_x3": 143.94, "r_y3": 100.6, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 151.94, "t": 107.74, "r": 172.01, "b": 113.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.94, "r_y0": 113.48, "r_x1": 172.01, "r_y1": 113.48, "r_x2": 172.01, "r_y2": 107.74, "r_x3": 151.94, "r_y3": 107.74, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 251.77, "t": 80.93, "r": 266.4, "b": 86.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.77, "r_y0": 86.67, "r_x1": 266.4, "r_y1": 86.67, "r_x2": 266.4, "r_y2": 80.93, "r_x3": 251.77, "r_y3": 80.93, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 247.52, "t": 86.03, "r": 270.65, "b": 91.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 91.77, "r_x1": 270.65, "r_y1": 91.77, "r_x2": 270.65, "r_y2": 86.03, "r_x3": 247.52, "r_y3": 86.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 331.04, "t": 78.56, "r": 352.13, "b": 84.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.04, "r_y0": 84.3, "r_x1": 352.13, "r_y1": 84.3, "r_x2": 352.13, "r_y2": 78.56, "r_x3": 331.04, "r_y3": 78.56, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 390.56, "t": 96.03, "r": 431.73, "b": 101.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.56, "r_y0": 101.77, "r_x1": 431.73, "r_y1": 101.77, "r_x2": 431.73, "r_y2": 96.03, "r_x3": 390.56, "r_y3": 96.03, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 386.82, "t": 102.15, "r": 435.47, "b": 107.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.82, "r_y0": 107.89, "r_x1": 435.47, "r_y1": 107.89, "r_x2": 435.47, "r_y2": 102.15, "r_x3": 386.82, "r_y3": 102.15, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 388.7, "t": 108.27, "r": 433.6, "b": 114.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 114.01, "r_x1": 433.6, "r_y1": 114.01, "r_x2": 433.6, "r_y2": 108.27, "r_x3": 388.7, "r_y3": 108.27, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 391.08, "t": 114.39, "r": 431.23, "b": 120.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.08, "r_y0": 120.13, "r_x1": 431.23, "r_y1": 120.13, "r_x2": 431.23, "r_y2": 114.39, "r_x3": 391.08, "r_y3": 114.39, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 431.23, "t": 151.69, "r": 498.82, "b": 157.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.23, "r_y0": 157.43, "r_x1": 498.82, "r_y1": 157.43, "r_x2": 498.82, "r_y2": 151.69, "r_x3": 431.23, "r_y3": 151.69, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 431.17, "t": 157.81, "r": 498.88, "b": 163.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.17, "r_y0": 163.55, "r_x1": 498.88, "r_y1": 163.55, "r_x2": 498.88, "r_y2": 157.81, "r_x3": 431.17, "r_y3": 157.81, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 440.53, "t": 163.93, "r": 489.52, "b": 169.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.53, "r_y0": 169.67, "r_x1": 489.52, "r_y1": 169.67, "r_x2": 489.52, "r_y2": 163.93, "r_x3": 440.53, "r_y3": 163.93, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 328.37, "t": 178.25, "r": 367.72, "b": 183.99, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.37, "r_y0": 183.99, "r_x1": 367.72, "r_y1": 183.99, "r_x2": 367.72, "r_y2": 178.25, "r_x3": 328.37, "r_y3": 178.25, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 331.84, "t": 123.91, "r": 373.68, "b": 129.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 129.65, "r_x1": 373.68, "r_y1": 129.65, "r_x2": 373.68, "r_y2": 123.91, "r_x3": 331.84, "r_y3": 123.91, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 331.84, "t": 129.01, "r": 381.18, "b": 134.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.84, "r_y0": 134.75, "r_x1": 381.18, "r_y1": 134.75, "r_x2": 381.18, "r_y2": 129.01, "r_x3": 331.84, "r_y3": 129.01, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 196.63, "t": 88.12, "r": 219.42, "b": 93.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.63, "r_y0": 93.86, "r_x1": 219.42, "r_y1": 93.86, "r_x2": 219.42, "r_y2": 88.12, "r_x3": 196.63, "r_y3": 88.12, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 246.67, "t": 129.49, "r": 271.5, "b": 135.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.67, "r_y0": 135.24, "r_x1": 271.5, "r_y1": 135.24, "r_x2": 271.5, "r_y2": 129.49, "r_x3": 246.67, "r_y3": 129.49, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 247.52, "t": 134.59, "r": 270.65, "b": 140.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.52, "r_y0": 140.34, "r_x1": 270.65, "r_y1": 140.34, "r_x2": 270.65, "r_y2": 134.59, "r_x3": 247.52, "r_y3": 134.59, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 330.63, "t": 89.02, "r": 365.55, "b": 94.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 94.76, "r_x1": 365.55, "r_y1": 94.76, "r_x2": 365.55, "r_y2": 89.02, "r_x3": 330.63, "r_y3": 89.02, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 330.63, "t": 97.18, "r": 370.23, "b": 102.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 102.92, "r_x1": 370.23, "r_y1": 102.92, "r_x2": 370.23, "r_y2": 97.18, "r_x3": 330.63, "r_y3": 97.18, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 330.63, "t": 105.34, "r": 374.51, "b": 111.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 111.08, "r_x1": 374.51, "r_y1": 111.08, "r_x2": 374.51, "r_y2": 105.34, "r_x3": 330.63, "r_y3": 105.34, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 330.63, "t": 113.5, "r": 335.73, "b": 119.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.63, "r_y0": 119.24, "r_x1": 335.73, "r_y1": 119.24, "r_x2": 335.73, "r_y2": 113.5, "r_x3": 330.63, "r_y3": 113.5, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 322.31, "t": 141.79, "r": 335.06, "b": 146.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 146.58, "r_x1": 335.06, "r_y1": 146.58, "r_x2": 335.06, "r_y2": 141.79, "r_x3": 322.31, "r_y3": 141.79, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 322.31, "t": 148.93, "r": 335.06, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 153.72, "r_x1": 335.06, "r_y1": 153.72, "r_x2": 335.06, "r_y2": 148.93, "r_x3": 322.31, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 337.55, "t": 148.56, "r": 340.95, "b": 154.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.55, "r_y0": 154.3, "r_x1": 340.95, "r_y1": 154.3, "r_x2": 340.95, "r_y2": 148.56, "r_x3": 337.55, "r_y3": 148.56, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 343.56, "t": 148.93, "r": 398.91, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 153.72, "r_x1": 398.91, "r_y1": 153.72, "r_x2": 398.91, "r_y2": 148.93, "r_x3": 343.56, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 407.42, "t": 148.93, "r": 421.59, "b": 153.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 153.72, "r_x1": 421.59, "r_y1": 153.72, "r_x2": 421.59, "r_y2": 148.93, "r_x3": 407.42, "r_y3": 148.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 322.31, "t": 156.07, "r": 349.23, "b": 160.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 160.86, "r_x1": 349.23, "r_y1": 160.86, "r_x2": 349.23, "r_y2": 156.07, "r_x3": 322.31, "r_y3": 156.07, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 322.31, "t": 163.21, "r": 335.06, "b": 168.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 168.0, "r_x1": 335.06, "r_y1": 168.0, "r_x2": 335.06, "r_y2": 163.21, "r_x3": 322.31, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 343.56, "t": 163.21, "r": 374.74, "b": 168.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.56, "r_y0": 168.0, "r_x1": 374.74, "r_y1": 168.0, "r_x2": 374.74, "r_y2": 163.21, "r_x3": 343.56, "r_y3": 163.21, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 322.31, "t": 170.35, "r": 326.56, "b": 175.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.31, "r_y0": 175.14, "r_x1": 326.56, "r_y1": 175.14, "r_x2": 326.56, "r_y2": 170.35, "r_x3": 322.31, "r_y3": 170.35, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 323.51, "t": 89.67, "r": 326.91, "b": 95.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.51, "r_y0": 95.41, "r_x1": 326.91, "r_y1": 95.41, "r_x2": 326.91, "r_y2": 89.67, "r_x3": 323.51, "r_y3": 89.67, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 323.72, "t": 97.79, "r": 327.12, "b": 103.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 103.53, "r_x1": 327.12, "r_y1": 103.53, "r_x2": 327.12, "r_y2": 97.79, "r_x3": 323.72, "r_y3": 97.79, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 323.72, "t": 105.99, "r": 327.12, "b": 111.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.72, "r_y0": 111.73, "r_x1": 327.12, "r_y1": 111.73, "r_x2": 327.12, "r_y2": 105.99, "r_x3": 323.72, "r_y3": 105.99, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 401.48, "t": 148.55, "r": 404.88, "b": 154.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.48, "r_y0": 154.29, "r_x1": 404.88, "r_y1": 154.29, "r_x2": 404.88, "r_y2": 148.55, "r_x3": 401.48, "r_y3": 148.55, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 337.7, "t": 162.68, "r": 341.1, "b": 168.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.7, "r_y0": 168.43, "r_x1": 341.1, "r_y1": 168.43, "r_x2": 341.1, "r_y2": 162.68, "r_x3": 337.7, "r_y3": 162.68, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 454.46, "t": 104.55, "r": 457.87, "b": 110.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.46, "r_y0": 110.29, "r_x1": 457.87, "r_y1": 110.29, "r_x2": 457.87, "r_y2": 104.55, "r_x3": 454.46, "r_y3": 104.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 493.33, "t": 91.1, "r": 496.73, "b": 96.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.33, "r_y0": 96.84, "r_x1": 496.73, "r_y1": 96.84, "r_x2": 496.73, "r_y2": 91.1, "r_x3": 493.33, "r_y3": 91.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 454.08, "t": 90.57, "r": 457.49, "b": 96.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.08, "r_y0": 96.31, "r_x1": 457.49, "r_y1": 96.31, "r_x2": 457.49, "r_y2": 90.57, "r_x3": 454.08, "r_y3": 90.57, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 50.11, "t": 203.99, "r": 545.11, "b": 224.97, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 213.01, "r_x1": 86.88, "r_y1": 213.01, "r_x2": 86.88, "r_y2": 204.11, "r_x3": 50.11, "r_y3": 204.11, "coord_origin": "TOPLEFT" }, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.02, "r_y0": 212.94, "r_x1": 149.85, "r_y1": 212.94, "r_x2": 149.85, "r_y2": 203.99, "r_x3": 94.02, "r_y3": 203.99, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.86, "r_y0": 213.01, "r_x1": 545.11, "r_y1": 213.01, "r_x2": 545.11, "r_y2": 204.11, "r_x3": 152.86, "r_y3": 204.11, "coord_origin": "TOPLEFT" }, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 224.97, "r_x1": 436.01, "r_y1": 224.97, "r_x2": 436.01, "r_y2": 216.06, "r_x3": 50.11, "r_y3": 216.06, "coord_origin": "TOPLEFT" }, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 3: TableFormer takes in an image of the PDF and creates bounding box and HTML structure predictions that are synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure." }, { "label": "picture", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "picture", "bbox": { "l": 53.03, "t": 257.67, "r": 285.37, "b": 507.67, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.25, "r_y0": 264.17, "r_x1": 101.76, "r_y1": 264.17, "r_x2": 101.76, "r_y2": 258.21, "r_x3": 74.25, "r_y3": 258.21, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.3, "r_y0": 264.31, "r_x1": 157.84, "r_y1": 264.31, "r_x2": 157.84, "r_y2": 258.35, "r_x3": 122.3, "r_y3": 258.35, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.55, "r_y0": 377.05, "r_x1": 125.68, "r_y1": 377.05, "r_x2": 125.68, "r_y2": 371.39, "r_x3": 78.55, "r_y3": 371.39, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.51, "r_y0": 396.98, "r_x1": 84.64, "r_y1": 396.98, "r_x2": 84.64, "r_y2": 391.32, "r_x3": 78.51, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.53, "r_y0": 396.98, "r_x1": 125.11, "r_y1": 396.98, "r_x2": 125.11, "r_y2": 391.32, "r_x3": 116.53, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.02, "r_y0": 430.12, "r_x1": 127.92, "r_y1": 430.12, "r_x2": 127.92, "r_y2": 424.45, "r_x3": 76.02, "r_y3": 424.45, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.38, "r_y0": 450.55, "r_x1": 84.51, "r_y1": 450.55, "r_x2": 84.51, "r_y2": 444.89, "r_x3": 78.38, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.4, "r_y0": 450.55, "r_x1": 124.98, "r_y1": 450.55, "r_x2": 124.98, "r_y2": 444.89, "r_x3": 116.4, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.47, "r_y0": 468.11, "r_x1": 181.63, "r_y1": 468.11, "r_x2": 181.63, "r_y2": 462.44, "r_x3": 167.47, "r_y3": 462.44, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61, "r_y0": 484.13, "r_x1": 184.43, "r_y1": 484.13, "r_x2": 184.43, "r_y2": 478.47, "r_x3": 165.61, "r_y3": 478.47, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.32, "r_y0": 330.22, "r_x1": 132.92, "r_y1": 330.22, "r_x2": 132.92, "r_y2": 324.26, "r_x3": 65.32, "r_y3": 324.26, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51, "r_y0": 274.73, "r_x1": 162.99, "r_y1": 274.73, "r_x2": 162.99, "r_y2": 269.66, "r_x3": 119.51, "r_y3": 269.66, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.73, "r_y0": 279.98, "r_x1": 151.41, "r_y1": 279.98, "r_x2": 151.41, "r_y2": 274.91, "r_x3": 128.73, "r_y3": 274.91, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.43, "r_y0": 344.27, "r_x1": 80.27, "r_y1": 344.27, "r_x2": 80.27, "r_y2": 338.96, "r_x3": 60.43, "r_y3": 338.96, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.6, "r_y0": 348.7, "r_x1": 78.85, "r_y1": 348.7, "r_x2": 78.85, "r_y2": 343.39, "r_x3": 60.6, "r_y3": 343.39, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.83, "r_y0": 298.69, "r_x1": 154.66, "r_y1": 298.69, "r_x2": 154.66, "r_y2": 293.38, "r_x3": 134.83, "r_y3": 293.38, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99, "r_y0": 303.11, "r_x1": 153.25, "r_y1": 303.11, "r_x2": 153.25, "r_y2": 297.8, "r_x3": 134.99, "r_y3": 297.8, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 351.02, "r_x1": 197.15, "r_y1": 351.02, "r_x2": 197.15, "r_y2": 345.36, "r_x3": 150.55, "r_y3": 345.36, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 400.09, "r_x1": 156.68, "r_y1": 400.09, "r_x2": 156.68, "r_y2": 394.42, "r_x3": 150.55, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 400.09, "r_x1": 197.15, "r_y1": 400.09, "r_x2": 197.15, "r_y2": 394.42, "r_x3": 188.57, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.19, "r_y0": 381.33, "r_x1": 197.32, "r_y1": 381.33, "r_x2": 197.32, "r_y2": 375.67, "r_x3": 150.19, "r_y3": 375.67, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 445.91, "r_x1": 156.68, "r_y1": 445.91, "r_x2": 156.68, "r_y2": 440.25, "r_x3": 150.55, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 445.91, "r_x1": 197.15, "r_y1": 445.91, "r_x2": 197.15, "r_y2": 440.25, "r_x3": 188.57, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86, "r_y0": 427.76, "r_x1": 199.76, "r_y1": 427.76, "r_x2": 199.76, "r_y2": 422.09, "r_x3": 147.86, "r_y3": 422.09, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.57, "r_y0": 319.92, "r_x1": 255.73, "r_y1": 319.92, "r_x2": 255.73, "r_y2": 314.26, "r_x3": 241.57, "r_y3": 314.26, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.92, "r_y0": 367.03, "r_x1": 256.08, "r_y1": 367.03, "r_x2": 256.08, "r_y2": 361.36, "r_x3": 241.92, "r_y3": 361.36, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.05, "r_y0": 342.28, "r_x1": 248.72, "r_y1": 342.28, "r_x2": 248.72, "r_y2": 336.62, "r_x3": 228.05, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 342.28, "r_x1": 269.39, "r_y1": 342.28, "r_x2": 269.39, "r_y2": 336.62, "r_x3": 246.29, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.45, "r_y0": 410.81, "r_x1": 238.74, "r_y1": 410.81, "r_x2": 238.74, "r_y2": 405.15, "r_x3": 228.45, "r_y3": 405.15, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.3, "r_y0": 410.87, "r_x1": 271.78, "r_y1": 410.87, "r_x2": 271.78, "r_y2": 405.2, "r_x3": 256.3, "r_y3": 405.2, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.55, "r_y0": 387.88, "r_x1": 258.09, "r_y1": 387.88, "r_x2": 258.09, "r_y2": 382.21, "r_x3": 239.55, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.15, "r_y0": 449.78, "r_x1": 59.51, "r_y1": 449.78, "r_x2": 59.51, "r_y2": 384.87, "r_x3": 54.15, "r_y3": 384.87, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.24, "r_y0": 378.45, "r_x1": 59.3, "r_y1": 378.45, "r_x2": 59.3, "r_y2": 373.81, "r_x3": 54.24, "r_y3": 373.81, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.3, "r_y0": 490.37, "r_x1": 122.16, "r_y1": 490.37, "r_x2": 122.16, "r_y2": 484.53, "r_x3": 85.3, "r_y3": 484.53, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.67, "r_y0": 285.46, "r_x1": 265.32, "r_y1": 285.46, "r_x2": 265.32, "r_y2": 279.55, "r_x3": 229.67, "r_y3": 279.55, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17, "r_y0": 506.13, "r_x1": 190.42, "r_y1": 506.13, "r_x2": 190.42, "r_y2": 500.3, "r_x3": 157.17, "r_y3": 500.3, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.82, "r_y0": 443.89, "r_x1": 270.78, "r_y1": 443.89, "r_x2": 270.78, "r_y2": 438.06, "r_x3": 227.82, "r_y3": 438.06, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.7, "r_y0": 449.89, "r_x1": 263.51, "r_y1": 449.89, "r_x2": 263.51, "r_y2": 444.06, "r_x3": 233.7, "r_y3": 444.06, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.75, "r_y0": 298.76, "r_x1": 212.16, "r_y1": 298.76, "r_x2": 212.16, "r_y2": 293.4, "r_x3": 184.75, "r_y3": 293.4, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91, "r_y0": 304.51, "r_x1": 216.74, "r_y1": 304.51, "r_x2": 216.74, "r_y2": 299.15, "r_x3": 178.91, "r_y3": 299.15, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.25, "r_y0": 287.85, "r_x1": 198.89, "r_y1": 287.85, "r_x2": 198.89, "r_y2": 282.78, "r_x3": 194.25, "r_y3": 282.78, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 277.83, "r_x1": 276.47, "r_y1": 277.83, "r_x2": 276.47, "r_y2": 271.87, "r_x3": 221.46, "r_y3": 271.87, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65, "r_y0": 329.1, "r_x1": 197.29, "r_y1": 329.1, "r_x2": 197.29, "r_y2": 323.44, "r_x3": 151.65, "r_y3": 323.44, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43, "r_y0": 335.1, "r_x1": 184.19, "r_y1": 335.1, "r_x2": 184.19, "r_y2": 329.44, "r_x3": 163.43, "r_y3": 329.44, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 70, "label": "text", "bbox": { "l": 74.25, "t": 258.21, "r": 101.76, "b": 264.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.25, "r_y0": 264.17, "r_x1": 101.76, "r_y1": 264.17, "r_x2": 101.76, "r_y2": 258.21, "r_x3": 74.25, "r_y3": 258.21, "coord_origin": "TOPLEFT" }, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 122.3, "t": 258.35, "r": 157.84, "b": 264.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.3, "r_y0": 264.31, "r_x1": 157.84, "r_y1": 264.31, "r_x2": 157.84, "r_y2": 258.35, "r_x3": 122.3, "r_y3": 258.35, "coord_origin": "TOPLEFT" }, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 78.55, "t": 371.39, "r": 125.68, "b": 377.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.55, "r_y0": 377.05, "r_x1": 125.68, "r_y1": 377.05, "r_x2": 125.68, "r_y2": 371.39, "r_x3": 78.55, "r_y3": 371.39, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 78.51, "t": 391.32, "r": 84.64, "b": 396.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.51, "r_y0": 396.98, "r_x1": 84.64, "r_y1": 396.98, "r_x2": 84.64, "r_y2": 391.32, "r_x3": 78.51, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 116.53, "t": 391.32, "r": 125.11, "b": 396.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.53, "r_y0": 396.98, "r_x1": 125.11, "r_y1": 396.98, "r_x2": 125.11, "r_y2": 391.32, "r_x3": 116.53, "r_y3": 391.32, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 76.02, "t": 424.45, "r": 127.92, "b": 430.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.02, "r_y0": 430.12, "r_x1": 127.92, "r_y1": 430.12, "r_x2": 127.92, "r_y2": 424.45, "r_x3": 76.02, "r_y3": 424.45, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 78.38, "t": 444.89, "r": 84.51, "b": 450.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.38, "r_y0": 450.55, "r_x1": 84.51, "r_y1": 450.55, "r_x2": 84.51, "r_y2": 444.89, "r_x3": 78.38, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 116.4, "t": 444.89, "r": 124.98, "b": 450.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.4, "r_y0": 450.55, "r_x1": 124.98, "r_y1": 450.55, "r_x2": 124.98, "r_y2": 444.89, "r_x3": 116.4, "r_y3": 444.89, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 167.47, "t": 462.44, "r": 181.63, "b": 468.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.47, "r_y0": 468.11, "r_x1": 181.63, "r_y1": 468.11, "r_x2": 181.63, "r_y2": 462.44, "r_x3": 167.47, "r_y3": 462.44, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 165.61, "t": 478.47, "r": 184.43, "b": 484.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.61, "r_y0": 484.13, "r_x1": 184.43, "r_y1": 484.13, "r_x2": 184.43, "r_y2": 478.47, "r_x3": 165.61, "r_y3": 478.47, "coord_origin": "TOPLEFT" }, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 65.32, "t": 324.26, "r": 132.92, "b": 330.22, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.32, "r_y0": 330.22, "r_x1": 132.92, "r_y1": 330.22, "r_x2": 132.92, "r_y2": 324.26, "r_x3": 65.32, "r_y3": 324.26, "coord_origin": "TOPLEFT" }, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 119.51, "t": 269.66, "r": 162.99, "b": 274.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.51, "r_y0": 274.73, "r_x1": 162.99, "r_y1": 274.73, "r_x2": 162.99, "r_y2": 269.66, "r_x3": 119.51, "r_y3": 269.66, "coord_origin": "TOPLEFT" }, "text": "[30, 1, 2, 3, 4, \u2026 3, ", "orig": "[30, 1, 2, 3, 4, \u2026 3, ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 128.73, "t": 274.91, "r": 151.41, "b": 279.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.73, "r_y0": 279.98, "r_x1": 151.41, "r_y1": 279.98, "r_x2": 151.41, "r_y2": 274.91, "r_x3": 128.73, "r_y3": 274.91, "coord_origin": "TOPLEFT" }, "text": "4, 5, 8, 31]", "orig": "4, 5, 8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 60.43, "t": 338.96, "r": 80.27, "b": 344.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.43, "r_y0": 344.27, "r_x1": 80.27, "r_y1": 344.27, "r_x2": 80.27, "r_y2": 338.96, "r_x3": 60.43, "r_y3": 338.96, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 60.6, "t": 343.39, "r": 78.85, "b": 348.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.6, "r_y0": 348.7, "r_x1": 78.85, "r_y1": 348.7, "r_x2": 78.85, "r_y2": 343.39, "r_x3": 60.6, "r_y3": 343.39, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 134.83, "t": 293.38, "r": 154.66, "b": 298.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.83, "r_y0": 298.69, "r_x1": 154.66, "r_y1": 298.69, "r_x2": 154.66, "r_y2": 293.38, "r_x3": 134.83, "r_y3": 293.38, "coord_origin": "TOPLEFT" }, "text": "Positional ", "orig": "Positional ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 134.99, "t": 297.8, "r": 153.25, "b": 303.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.99, "r_y0": 303.11, "r_x1": 153.25, "r_y1": 303.11, "r_x2": 153.25, "r_y2": 297.8, "r_x3": 134.99, "r_y3": 297.8, "coord_origin": "TOPLEFT" }, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 150.55, "t": 345.36, "r": 197.15, "b": 351.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 351.02, "r_x1": 197.15, "r_y1": 351.02, "r_x2": 197.15, "r_y2": 345.36, "r_x3": 150.55, "r_y3": 345.36, "coord_origin": "TOPLEFT" }, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 150.55, "t": 394.42, "r": 156.68, "b": 400.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 400.09, "r_x1": 156.68, "r_y1": 400.09, "r_x2": 156.68, "r_y2": 394.42, "r_x3": 150.55, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 188.57, "t": 394.42, "r": 197.15, "b": 400.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 400.09, "r_x1": 197.15, "r_y1": 400.09, "r_x2": 197.15, "r_y2": 394.42, "r_x3": 188.57, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 150.19, "t": 375.67, "r": 197.32, "b": 381.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.19, "r_y0": 381.33, "r_x1": 197.32, "r_y1": 381.33, "r_x2": 197.32, "r_y2": 375.67, "r_x3": 150.19, "r_y3": 375.67, "coord_origin": "TOPLEFT" }, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 150.55, "t": 440.25, "r": 156.68, "b": 445.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.55, "r_y0": 445.91, "r_x1": 156.68, "r_y1": 445.91, "r_x2": 156.68, "r_y2": 440.25, "r_x3": 150.55, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "Add", "orig": "Add", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 188.57, "t": 440.25, "r": 197.15, "b": 445.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.57, "r_y0": 445.91, "r_x1": 197.15, "r_y1": 445.91, "r_x2": 197.15, "r_y2": 440.25, "r_x3": 188.57, "r_y3": 440.25, "coord_origin": "TOPLEFT" }, "text": "& Normalisation", "orig": "& Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 147.86, "t": 422.09, "r": 199.76, "b": 427.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.86, "r_y0": 427.76, "r_x1": 199.76, "r_y1": 427.76, "r_x2": 199.76, "r_y2": 422.09, "r_x3": 147.86, "r_y3": 422.09, "coord_origin": "TOPLEFT" }, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 241.57, "t": 314.26, "r": 255.73, "b": 319.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.57, "r_y0": 319.92, "r_x1": 255.73, "r_y1": 319.92, "r_x2": 255.73, "r_y2": 314.26, "r_x3": 241.57, "r_y3": 314.26, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 241.92, "t": 361.36, "r": 256.08, "b": 367.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.92, "r_y0": 367.03, "r_x1": 256.08, "r_y1": 367.03, "r_x2": 256.08, "r_y2": 361.36, "r_x3": 241.92, "r_y3": 361.36, "coord_origin": "TOPLEFT" }, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 228.05, "t": 336.62, "r": 248.72, "b": 342.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.05, "r_y0": 342.28, "r_x1": 248.72, "r_y1": 342.28, "r_x2": 248.72, "r_y2": 336.62, "r_x3": 228.05, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 246.29, "t": 336.62, "r": 269.39, "b": 342.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 342.28, "r_x1": 269.39, "r_y1": 342.28, "r_x2": 269.39, "r_y2": 336.62, "r_x3": 246.29, "r_y3": 336.62, "coord_origin": "TOPLEFT" }, "text": "Network", "orig": "Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 228.45, "t": 405.15, "r": 238.74, "b": 410.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.45, "r_y0": 410.81, "r_x1": 238.74, "r_y1": 410.81, "r_x2": 238.74, "r_y2": 405.15, "r_x3": 228.45, "r_y3": 405.15, "coord_origin": "TOPLEFT" }, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 256.3, "t": 405.2, "r": 271.78, "b": 410.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.3, "r_y0": 410.87, "r_x1": 271.78, "r_y1": 410.87, "r_x2": 271.78, "r_y2": 405.2, "r_x3": 256.3, "r_y3": 405.2, "coord_origin": "TOPLEFT" }, "text": "Linear ", "orig": "Linear ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 239.55, "t": 382.21, "r": 258.09, "b": 387.88, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.55, "r_y0": 387.88, "r_x1": 258.09, "r_y1": 387.88, "r_x2": 258.09, "r_y2": 382.21, "r_x3": 239.55, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 54.15, "t": 384.87, "r": 59.51, "b": 449.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.15, "r_y0": 449.78, "r_x1": 59.51, "r_y1": 449.78, "r_x2": 59.51, "r_y2": 384.87, "r_x3": 54.15, "r_y3": 384.87, "coord_origin": "TOPLEFT" }, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 54.24, "t": 373.81, "r": 59.3, "b": 378.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.24, "r_y0": 378.45, "r_x1": 59.3, "r_y1": 378.45, "r_x2": 59.3, "r_y2": 373.81, "r_x3": 54.24, "r_y3": 373.81, "coord_origin": "TOPLEFT" }, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 85.3, "t": 484.53, "r": 122.16, "b": 490.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.3, "r_y0": 490.37, "r_x1": 122.16, "r_y1": 490.37, "r_x2": 122.16, "r_y2": 484.53, "r_x3": 85.3, "r_y3": 484.53, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 229.67, "t": 279.55, "r": 265.32, "b": 285.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.67, "r_y0": 285.46, "r_x1": 265.32, "r_y1": 285.46, "r_x2": 265.32, "r_y2": 279.55, "r_x3": 229.67, "r_y3": 279.55, "coord_origin": "TOPLEFT" }, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 157.17, "t": 500.3, "r": 190.42, "b": 506.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.17, "r_y0": 506.13, "r_x1": 190.42, "r_y1": 506.13, "r_x2": 190.42, "r_y2": 500.3, "r_x3": 157.17, "r_y3": 500.3, "coord_origin": "TOPLEFT" }, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 227.82, "t": 438.06, "r": 270.78, "b": 443.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.82, "r_y0": 443.89, "r_x1": 270.78, "r_y1": 443.89, "r_x2": 270.78, "r_y2": 438.06, "r_x3": 227.82, "r_y3": 438.06, "coord_origin": "TOPLEFT" }, "text": "Bounding Boxes & ", "orig": "Bounding Boxes & ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 233.7, "t": 444.06, "r": 263.51, "b": 449.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.7, "r_y0": 449.89, "r_x1": 263.51, "r_y1": 449.89, "r_x2": 263.51, "r_y2": 444.06, "r_x3": 233.7, "r_y3": 444.06, "coord_origin": "TOPLEFT" }, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 184.75, "t": 293.4, "r": 212.16, "b": 298.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.75, "r_y0": 298.76, "r_x1": 212.16, "r_y1": 298.76, "r_x2": 212.16, "r_y2": 293.4, "r_x3": 184.75, "r_y3": 293.4, "coord_origin": "TOPLEFT" }, "text": "Transformer ", "orig": "Transformer ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 178.91, "t": 299.15, "r": 216.74, "b": 304.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.91, "r_y0": 304.51, "r_x1": 216.74, "r_y1": 304.51, "r_x2": 216.74, "r_y2": 299.15, "r_x3": 178.91, "r_y3": 299.15, "coord_origin": "TOPLEFT" }, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 194.25, "t": 282.78, "r": 198.89, "b": 287.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.25, "r_y0": 287.85, "r_x1": 198.89, "r_y1": 287.85, "r_x2": 198.89, "r_y2": 282.78, "r_x3": 194.25, "r_y3": 282.78, "coord_origin": "TOPLEFT" }, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 221.46, "t": 271.87, "r": 276.47, "b": 277.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 277.83, "r_x1": 276.47, "r_y1": 277.83, "r_x2": 276.47, "r_y2": 271.87, "r_x3": 221.46, "r_y3": 271.87, "coord_origin": "TOPLEFT" }, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 151.65, "t": 323.44, "r": 197.29, "b": 329.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.65, "r_y0": 329.1, "r_x1": 197.29, "r_y1": 329.1, "r_x2": 197.29, "r_y2": 323.44, "r_x3": 151.65, "r_y3": 323.44, "coord_origin": "TOPLEFT" }, "text": "Masked Multi-Head ", "orig": "Masked Multi-Head ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 163.43, "t": 329.44, "r": 184.19, "b": 335.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.43, "r_y0": 335.1, "r_x1": 184.19, "r_y1": 335.1, "r_x2": 184.19, "r_y2": 329.44, "r_x3": 163.43, "r_y3": 329.44, "coord_origin": "TOPLEFT" }, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 8, "page_no": 4, "cluster": { "id": 8, "label": "caption", "bbox": { "l": 50.11, "t": 527.78, "r": 286.37, "b": 680.27, "coord_origin": "TOPLEFT" }, "confidence": 0.891, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 536.81, "r_x1": 229.79, "r_y1": 536.81, "r_x2": 229.79, "r_y2": 527.9, "r_x3": 50.11, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "Figure 4: Given an input image of a table, the", "orig": "Figure 4: Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.79, "r_y0": 536.74, "r_x1": 267.76, "r_y1": 536.74, "r_x2": 267.76, "r_y2": 527.78, "r_x3": 231.79, "r_y3": 527.78, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.76, "r_y0": 536.81, "r_x1": 286.36, "r_y1": 536.81, "r_x2": 286.36, "r_y2": 527.9, "r_x3": 269.76, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 548.76, "r_x1": 286.37, "r_y1": 548.76, "r_x2": 286.37, "r_y2": 539.86, "r_x3": 50.11, "r_y3": 539.86, "coord_origin": "TOPLEFT" }, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 560.72, "r_x1": 205.85, "r_y1": 560.72, "r_x2": 205.85, "r_y2": 551.81, "r_x3": 50.11, "r_y3": 551.81, "coord_origin": "TOPLEFT" }, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.02, "r_y0": 560.65, "r_x1": 286.36, "r_y1": 560.65, "r_x2": 286.36, "r_y2": 551.69, "r_x3": 208.02, "r_y3": 551.69, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 572.67, "r_x1": 64.5, "r_y1": 572.67, "r_x2": 64.5, "r_y2": 563.77, "r_x3": 50.11, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.17, "r_y0": 572.61, "r_x1": 151.31, "r_y1": 572.61, "r_x2": 151.31, "r_y2": 563.65, "r_x3": 68.17, "r_y3": 563.65, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.31, "r_y0": 572.67, "r_x1": 153.8, "r_y1": 572.67, "r_x2": 153.8, "r_y2": 563.77, "r_x3": 151.31, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.42, "r_y0": 572.67, "r_x1": 241.93, "r_y1": 572.67, "r_x2": 241.93, "r_y2": 563.77, "r_x3": 160.42, "r_y3": 563.77, "coord_origin": "TOPLEFT" }, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.6, "r_y0": 572.61, "r_x1": 286.36, "r_y1": 572.61, "r_x2": 286.36, "r_y2": 563.65, "r_x3": 245.6, "r_y3": 563.65, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 584.56, "r_x1": 85.52, "r_y1": 584.56, "r_x2": 85.52, "r_y2": 575.6, "r_x3": 50.11, "r_y3": 575.6, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.62, "r_y0": 584.63, "r_x1": 286.36, "r_y1": 584.63, "r_x2": 286.36, "r_y2": 575.72, "r_x3": 88.62, "r_y3": 575.72, "coord_origin": "TOPLEFT" }, "text": "receives \u2018tokenized tags\u2019 of the HTML code that", "orig": "receives \u2018tokenized tags\u2019 of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 596.58, "r_x1": 286.37, "r_y1": 596.58, "r_x2": 286.37, "r_y2": 587.68, "r_x3": 50.11, "r_y3": 587.68, "coord_origin": "TOPLEFT" }, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 608.54, "r_x1": 286.37, "r_y1": 608.54, "r_x2": 286.37, "r_y2": 599.63, "r_x3": 50.11, "r_y3": 599.63, "coord_origin": "TOPLEFT" }, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 620.49, "r_x1": 240.44, "r_y1": 620.49, "r_x2": 240.44, "r_y2": 611.59, "r_x3": 50.11, "r_y3": 611.59, "coord_origin": "TOPLEFT" }, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.2, "r_y0": 620.43, "r_x1": 286.37, "r_y1": 620.43, "r_x2": 286.37, "r_y2": 611.47, "r_x3": 243.2, "r_y3": 611.47, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 632.38, "r_x1": 286.37, "r_y1": 632.38, "r_x2": 286.37, "r_y2": 623.42, "r_x3": 50.11, "r_y3": 623.42, "coord_origin": "TOPLEFT" }, "text": "Decoder. The linear layer is applied to the features to", "orig": "Decoder. The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 644.34, "r_x1": 286.37, "r_y1": 644.34, "r_x2": 286.37, "r_y2": 635.38, "r_x3": 50.11, "r_y3": 635.38, "coord_origin": "TOPLEFT" }, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 656.36, "r_x1": 220.58, "r_y1": 656.36, "r_x2": 220.58, "r_y2": 647.45, "r_x3": 50.11, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "selects features referring to the data cells (\u2018", "orig": "selects features referring to the data cells (\u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.58, "r_y0": 656.14, "r_x1": 228.33, "r_y1": 656.14, "r_x2": 228.33, "r_y2": 647.29, "r_x3": 220.58, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.33, "r_y0": 656.36, "r_x1": 236.08, "r_y1": 656.36, "r_x2": 236.08, "r_y2": 647.45, "r_x3": 228.33, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.08, "r_y0": 656.14, "r_x1": 243.83, "r_y1": 656.14, "r_x2": 243.83, "r_y2": 647.29, "r_x3": 236.08, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.83, "r_y0": 656.36, "r_x1": 255.29, "r_y1": 656.36, "r_x2": 255.29, "r_y2": 647.45, "r_x3": 243.83, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "\u2019, \u2018", "orig": "\u2019, \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.29, "r_y0": 656.14, "r_x1": 263.04, "r_y1": 656.14, "r_x2": 263.04, "r_y2": 647.29, "r_x3": 255.29, "r_y3": 647.29, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.04, "r_y0": 656.36, "r_x1": 286.36, "r_y1": 656.36, "r_x2": 286.36, "r_y2": 647.45, "r_x3": 263.04, "r_y3": 647.45, "coord_origin": "TOPLEFT" }, "text": "\u2019) and", "orig": "\u2019) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 668.32, "r_x1": 286.37, "r_y1": 668.32, "r_x2": 286.37, "r_y2": 659.41, "r_x3": 50.11, "r_y3": 659.41, "coord_origin": "TOPLEFT" }, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 680.27, "r_x1": 218.47, "r_y1": 680.27, "r_x2": 218.47, "r_y2": 671.36, "r_x3": 50.11, "r_y3": 671.36, "coord_origin": "TOPLEFT" }, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 4: Given an input image of a table, the Encoder produces fixed-length features that represent the input image. The features are then passed to both the Structure Decoder and Cell BBox Decoder . During training, the Structure Decoder receives 'tokenized tags' of the HTML code that represent the table structure. Afterwards, a transformer encoder and decoder architecture is employed to produce features that are received by a linear layer, and the Cell BBox Decoder. The linear layer is applied to the features to predict the tags. Simultaneously, the Cell BBox Decoder selects features referring to the data cells (' < td > ', ' < ') and passes them through an attention network, an MLP, and a linear layer to predict the bounding boxes." }, { "label": "text", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 249.53, "r": 545.12, "b": 294.31, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 258.44, "r_x1": 523.06, "r_y1": 258.44, "r_x2": 523.06, "r_y2": 249.53, "r_x3": 308.86, "r_y3": 249.53, "coord_origin": "TOPLEFT" }, "text": "forming classification, and adding an adaptive pooling", "orig": "forming classification, and adding an adaptive pooling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.2, "r_y0": 258.44, "r_x1": 545.12, "r_y1": 258.44, "r_x2": 545.12, "r_y2": 249.53, "r_x3": 525.2, "r_y3": 249.53, "coord_origin": "TOPLEFT" }, "text": "layer", "orig": "layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 270.4, "r_x1": 517.56, "r_y1": 270.4, "r_x2": 517.56, "r_y2": 261.49, "r_x3": 308.86, "r_y3": 261.49, "coord_origin": "TOPLEFT" }, "text": "of size 28*28. ResNet by default downsamples the", "orig": "of size 28*28. ResNet by default downsamples the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 270.4, "r_x1": 545.11, "r_y1": 270.4, "r_x2": 545.11, "r_y2": 261.49, "r_x3": 520.77, "r_y3": 261.49, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 282.35, "r_x1": 534.8, "r_y1": 282.35, "r_x2": 534.8, "r_y2": 273.45, "r_x3": 308.86, "r_y3": 273.45, "coord_origin": "TOPLEFT" }, "text": "resolution by 32 and then the encoded image is provided", "orig": "resolution by 32 and then the encoded image is provided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 537.36, "r_y0": 282.35, "r_x1": 545.12, "r_y1": 282.35, "r_x2": 545.12, "r_y2": 273.45, "r_x3": 537.36, "r_y3": 273.45, "coord_origin": "TOPLEFT" }, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 294.31, "r_x1": 341.24, "r_y1": 294.31, "r_x2": 341.24, "r_y2": 285.4, "r_x3": 308.86, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.73, "r_y0": 294.08, "r_x1": 417.24, "r_y1": 294.08, "r_x2": 417.24, "r_y2": 285.49, "r_x3": 343.73, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 417.23, "r_y0": 294.31, "r_x1": 436.6, "r_y1": 294.31, "r_x2": 436.6, "r_y2": 285.4, "r_x3": 417.23, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.09, "r_y0": 294.08, "r_x1": 516.56, "r_y1": 294.08, "r_x2": 516.56, "r_y2": 285.49, "r_x3": 439.09, "r_y3": 285.49, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.56, "r_y0": 294.31, "r_x1": 519.05, "r_y1": 294.31, "r_x2": 519.05, "r_y2": 285.4, "r_x3": 516.56, "r_y3": 285.4, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "forming classification, and adding an adaptive pooling layer of size 28*28. ResNet by default downsamples the image resolution by 32 and then the encoded image is provided to both the Structure Decoder , and Cell BBox Decoder ." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 297.34, "r": 545.12, "b": 413.96, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 306.3, "r_x1": 400.87, "r_y1": 306.3, "r_x2": 400.87, "r_y2": 297.34, "r_x3": 320.82, "r_y3": 297.34, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.91, "r_y0": 306.37, "r_x1": 528.34, "r_y1": 306.37, "r_x2": 528.34, "r_y2": 297.46, "r_x3": 403.91, "r_y3": 297.46, "coord_origin": "TOPLEFT" }, "text": "The transformer architecture of", "orig": "The transformer architecture of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.72, "r_y0": 306.37, "r_x1": 545.11, "r_y1": 306.37, "r_x2": 545.11, "r_y2": 297.46, "r_x3": 530.72, "r_y3": 297.46, "coord_origin": "TOPLEFT" }, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 318.32, "r_x1": 517.53, "r_y1": 318.32, "r_x2": 517.53, "r_y2": 309.41, "r_x3": 308.86, "r_y3": 309.41, "coord_origin": "TOPLEFT" }, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.09, "r_y0": 318.32, "r_x1": 545.11, "r_y1": 318.32, "r_x2": 545.11, "r_y2": 309.41, "r_x3": 524.09, "r_y3": 309.41, "coord_origin": "TOPLEFT" }, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 330.28, "r_x1": 432.36, "r_y1": 330.28, "r_x2": 432.36, "r_y2": 321.37, "r_x3": 308.86, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.82, "r_y0": 330.05, "r_x1": 510.29, "r_y1": 330.05, "r_x2": 510.29, "r_y2": 321.46, "r_x3": 435.82, "r_y3": 321.46, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.98, "r_y0": 330.28, "r_x1": 520.62, "r_y1": 330.28, "r_x2": 520.62, "r_y2": 321.37, "r_x3": 513.98, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 524.08, "r_y0": 330.28, "r_x1": 545.11, "r_y1": 330.28, "r_x2": 545.11, "r_y2": 321.37, "r_x3": 524.08, "r_y3": 321.37, "coord_origin": "TOPLEFT" }, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 342.23, "r_x1": 527.76, "r_y1": 342.23, "r_x2": 527.76, "r_y2": 333.32, "r_x3": 308.86, "r_y3": 333.32, "coord_origin": "TOPLEFT" }, "text": "eled as a transformer encoder with two encoder layers", "orig": "eled as a transformer encoder with two encoder layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.73, "r_y0": 342.23, "r_x1": 545.11, "r_y1": 342.23, "r_x2": 545.11, "r_y2": 333.32, "r_x3": 530.73, "r_y3": 333.32, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 354.19, "r_x1": 526.85, "r_y1": 354.19, "r_x2": 526.85, "r_y2": 345.28, "r_x3": 308.86, "r_y3": 345.28, "coord_origin": "TOPLEFT" }, "text": "a transformer decoder made from a stack of 4 decoder", "orig": "a transformer decoder made from a stack of 4 decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 354.19, "r_x1": 545.11, "r_y1": 354.19, "r_x2": 545.11, "r_y2": 345.28, "r_x3": 529.62, "r_y3": 345.28, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 366.14, "r_x1": 524.51, "r_y1": 366.14, "r_x2": 524.51, "r_y2": 357.24, "r_x3": 308.86, "r_y3": 357.24, "coord_origin": "TOPLEFT" }, "text": "ers that comprise mainly of multi-head attention and", "orig": "ers that comprise mainly of multi-head attention and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.97, "r_y0": 366.14, "r_x1": 545.12, "r_y1": 366.14, "r_x2": 545.12, "r_y2": 357.24, "r_x3": 527.97, "r_y3": 357.24, "coord_origin": "TOPLEFT" }, "text": "feed", "orig": "feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 378.1, "r_x1": 370.39, "r_y1": 378.1, "r_x2": 370.39, "r_y2": 369.19, "r_x3": 308.86, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.44, "r_y0": 378.1, "r_x1": 526.91, "r_y1": 378.1, "r_x2": 526.91, "r_y2": 369.19, "r_x3": 377.44, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "This configuration uses fewer layers", "orig": "This configuration uses fewer layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 530.73, "r_y0": 378.1, "r_x1": 545.12, "r_y1": 378.1, "r_x2": 545.12, "r_y2": 369.19, "r_x3": 530.73, "r_y3": 369.19, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 390.05, "r_x1": 505.46, "r_y1": 390.05, "r_x2": 505.46, "r_y2": 381.15, "r_x3": 308.86, "r_y3": 381.15, "coord_origin": "TOPLEFT" }, "text": "heads in comparison to networks applied to other", "orig": "heads in comparison to networks applied to other", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.03, "r_y0": 390.05, "r_x1": 545.12, "r_y1": 390.05, "r_x2": 545.12, "r_y2": 381.15, "r_x3": 508.03, "r_y3": 381.15, "coord_origin": "TOPLEFT" }, "text": "problems", "orig": "problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 402.01, "r_x1": 517.69, "r_y1": 402.01, "r_x2": 517.69, "r_y2": 393.1, "r_x3": 308.86, "r_y3": 393.1, "coord_origin": "TOPLEFT" }, "text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 402.01, "r_x1": 545.11, "r_y1": 402.01, "r_x2": 545.11, "r_y2": 393.1, "r_x3": 520.77, "r_y3": 393.1, "coord_origin": "TOPLEFT" }, "text": "some-", "orig": "some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 413.96, "r_x1": 528.02, "r_y1": 413.96, "r_x2": 528.02, "r_y2": 405.06, "r_x3": 308.86, "r_y3": 405.06, "coord_origin": "TOPLEFT" }, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Structure Decoder. The transformer architecture of this component is based on the work proposed in [31]. After extensive experimentation, the Structure Decoder is modeled as a transformer encoder with two encoder layers and a transformer decoder made from a stack of 4 decoder layers that comprise mainly of multi-head attention and feed forward layers. This configuration uses fewer layers and heads in comparison to networks applied to other problems (e.g. \"Scene Understanding\", \"Image Captioning\"), something which we relate to the simplicity of table images." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 417.11, "r": 545.12, "b": 545.57, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 426.02, "r_x1": 515.5, "r_y1": 426.02, "r_x2": 515.5, "r_y2": 417.11, "r_x3": 320.82, "r_y3": 417.11, "coord_origin": "TOPLEFT" }, "text": "The transformer encoder receives an encoded", "orig": "The transformer encoder receives an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 520.77, "r_y0": 426.02, "r_x1": 545.11, "r_y1": 426.02, "r_x2": 545.11, "r_y2": 417.11, "r_x3": 520.77, "r_y3": 417.11, "coord_origin": "TOPLEFT" }, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 437.98, "r_x1": 343.72, "r_y1": 437.98, "r_x2": 343.72, "r_y2": 429.07, "r_x3": 308.86, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.04, "r_y0": 437.75, "r_x1": 446.45, "r_y1": 437.75, "r_x2": 446.45, "r_y2": 429.16, "r_x3": 347.04, "r_y3": 429.16, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.94, "r_y0": 437.98, "r_x1": 503.06, "r_y1": 437.98, "r_x2": 503.06, "r_y2": 429.07, "r_x3": 449.94, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "and refines it", "orig": "and refines it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 506.38, "r_y0": 437.98, "r_x1": 537.37, "r_y1": 437.98, "r_x2": 537.37, "r_y2": 429.07, "r_x3": 506.38, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "through", "orig": "through", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 540.69, "r_y0": 437.98, "r_x1": 545.11, "r_y1": 437.98, "r_x2": 545.11, "r_y2": 429.07, "r_x3": 540.69, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 449.93, "r_x1": 522.79, "r_y1": 449.93, "r_x2": 522.79, "r_y2": 441.02, "r_x3": 308.86, "r_y3": 441.02, "coord_origin": "TOPLEFT" }, "text": "multi-head dot-product attention layer, followed by a", "orig": "multi-head dot-product attention layer, followed by a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 525.75, "r_y0": 449.93, "r_x1": 545.12, "r_y1": 449.93, "r_x2": 545.12, "r_y2": 441.02, "r_x3": 525.75, "r_y3": 441.02, "coord_origin": "TOPLEFT" }, "text": "Feed", "orig": "Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 461.89, "r_x1": 384.15, "r_y1": 461.89, "r_x2": 384.15, "r_y2": 452.98, "r_x3": 308.86, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.37, "r_y0": 461.89, "r_x1": 527.85, "r_y1": 461.89, "r_x2": 527.85, "r_y2": 452.98, "r_x3": 393.37, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "During training, the transformer", "orig": "During training, the transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.39, "r_y0": 461.89, "r_x1": 545.12, "r_y1": 461.89, "r_x2": 545.12, "r_y2": 452.98, "r_x3": 532.39, "r_y3": 452.98, "coord_origin": "TOPLEFT" }, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 473.84, "r_x1": 529.76, "r_y1": 473.84, "r_x2": 529.76, "r_y2": 464.94, "r_x3": 308.86, "r_y3": 464.94, "coord_origin": "TOPLEFT" }, "text": "coder receives as input the output feature produced by", "orig": "coder receives as input the output feature produced by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 532.94, "r_y0": 473.84, "r_x1": 545.12, "r_y1": 473.84, "r_x2": 545.12, "r_y2": 464.94, "r_x3": 532.94, "r_y3": 464.94, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 485.8, "r_x1": 514.17, "r_y1": 485.8, "r_x2": 514.17, "r_y2": 476.89, "r_x3": 308.86, "r_y3": 476.89, "coord_origin": "TOPLEFT" }, "text": "transformer encoder, and the tokenized input of the", "orig": "transformer encoder, and the tokenized input of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.89, "r_y0": 485.8, "r_x1": 545.12, "r_y1": 485.8, "r_x2": 545.12, "r_y2": 476.89, "r_x3": 516.89, "r_y3": 476.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.75, "r_x1": 527.63, "r_y1": 497.75, "r_x2": 527.63, "r_y2": 488.85, "r_x3": 308.86, "r_y3": 488.85, "coord_origin": "TOPLEFT" }, "text": "ground-truth tags. Using a stack of multi-head attention", "orig": "ground-truth tags. Using a stack of multi-head attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 529.62, "r_y0": 497.75, "r_x1": 545.11, "r_y1": 497.75, "r_x2": 545.11, "r_y2": 488.85, "r_x3": 529.62, "r_y3": 488.85, "coord_origin": "TOPLEFT" }, "text": "lay-", "orig": "lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 509.71, "r_x1": 508.36, "r_y1": 509.71, "r_x2": 508.36, "r_y2": 500.8, "r_x3": 308.86, "r_y3": 500.8, "coord_origin": "TOPLEFT" }, "text": "ers, different aspects of the tag sequence could be", "orig": "ers, different aspects of the tag sequence could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.09, "r_y0": 509.71, "r_x1": 545.12, "r_y1": 509.71, "r_x2": 545.12, "r_y2": 500.8, "r_x3": 511.09, "r_y3": 500.8, "coord_origin": "TOPLEFT" }, "text": "inferred.", "orig": "inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 521.66, "r_x1": 545.11, "r_y1": 521.66, "r_x2": 545.11, "r_y2": 512.76, "r_x3": 308.86, "r_y3": 512.76, "coord_origin": "TOPLEFT" }, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.62, "r_x1": 545.12, "r_y1": 533.62, "r_x2": 545.12, "r_y2": 524.71, "r_x3": 308.86, "r_y3": 524.71, "coord_origin": "TOPLEFT" }, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.57, "r_x1": 369.73, "r_y1": 545.57, "r_x2": 369.73, "r_y2": 536.67, "r_x3": 308.86, "r_y3": 536.67, "coord_origin": "TOPLEFT" }, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The transformer encoder receives an encoded image from the CNN Backbone Network and refines it through a multi-head dot-product attention layer, followed by a Feed Forward Network. During training, the transformer decoder receives as input the output feature produced by the transformer encoder, and the tokenized input of the HTML ground-truth tags. Using a stack of multi-head attention layers, different aspects of the tag sequence could be inferred. This is achieved by each attention head on a layer operating in a different subspace, and then combining altogether their attention score." }, { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 548.6, "r": 545.12, "b": 653.27, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 557.56, "r_x1": 404.76, "r_y1": 557.56, "r_x2": 404.76, "r_y2": 548.6, "r_x3": 320.82, "r_y3": 548.6, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.34, "r_y0": 557.63, "r_x1": 545.12, "r_y1": 557.63, "r_x2": 545.12, "r_y2": 548.72, "r_x3": 410.34, "r_y3": 548.72, "coord_origin": "TOPLEFT" }, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.59, "r_x1": 545.11, "r_y1": 569.59, "r_x2": 545.11, "r_y2": 560.68, "r_x3": 308.86, "r_y3": 560.68, "coord_origin": "TOPLEFT" }, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.54, "r_x1": 545.12, "r_y1": 581.54, "r_x2": 545.12, "r_y2": 572.64, "r_x3": 308.86, "r_y3": 572.64, "coord_origin": "TOPLEFT" }, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.5, "r_x1": 545.11, "r_y1": 593.5, "r_x2": 545.11, "r_y2": 584.59, "r_x3": 308.86, "r_y3": 584.59, "coord_origin": "TOPLEFT" }, "text": "to end. This approach is inspired by DETR [1] which em-", "orig": "to end. This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.45, "r_x1": 545.11, "r_y1": 605.45, "r_x2": 545.11, "r_y2": 596.55, "r_x3": 308.86, "r_y3": 596.55, "coord_origin": "TOPLEFT" }, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.41, "r_x1": 545.12, "r_y1": 617.41, "r_x2": 545.12, "r_y2": 608.5, "r_x3": 308.86, "r_y3": 608.5, "coord_origin": "TOPLEFT" }, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.36, "r_x1": 545.12, "r_y1": 629.36, "r_x2": 545.12, "r_y2": 620.46, "r_x3": 308.86, "r_y3": 620.46, "coord_origin": "TOPLEFT" }, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.32, "r_x1": 381.68, "r_y1": 641.32, "r_x2": 381.68, "r_y2": 632.41, "r_x3": 308.86, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.0, "r_y0": 641.1, "r_x1": 391.75, "r_y1": 641.1, "r_x2": 391.75, "r_y2": 632.25, "r_x3": 384.0, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.75, "r_y0": 641.32, "r_x1": 399.5, "r_y1": 641.32, "r_x2": 399.5, "r_y2": 632.41, "r_x3": 391.75, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 399.5, "r_y0": 641.1, "r_x1": 407.25, "r_y1": 641.1, "r_x2": 407.25, "r_y2": 632.25, "r_x3": 399.5, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.25, "r_y0": 641.32, "r_x1": 432.91, "r_y1": 641.32, "r_x2": 432.91, "r_y2": 632.41, "r_x3": 407.25, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "\u2019 and \u2018", "orig": "\u2019 and \u2018", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.91, "r_y0": 641.1, "r_x1": 440.66, "r_y1": 641.1, "r_x2": 440.66, "r_y2": 632.25, "r_x3": 432.91, "r_y3": 632.25, "coord_origin": "TOPLEFT" }, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.66, "r_y0": 641.32, "r_x1": 545.11, "r_y1": 641.32, "r_x2": 545.11, "r_y2": 632.41, "r_x3": 440.66, "r_y3": 632.41, "coord_origin": "TOPLEFT" }, "text": "\u2019 HTML structure tags be-", "orig": "\u2019 HTML structure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.27, "r_x1": 398.96, "r_y1": 653.27, "r_x2": 398.96, "r_y2": 644.37, "r_x3": 308.86, "r_y3": 644.37, "coord_origin": "TOPLEFT" }, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell BBox Decoder. Our architecture allows to simultaneously predict HTML tags and bounding boxes for each table cell without the need of a separate object detector end to end. This approach is inspired by DETR [1] which employs a Transformer Encoder, and Decoder that looks for a specific number of object queries (potential object detections). As our model utilizes a transformer architecture, the hidden state of the < td > ' and ' < ' HTML structure tags become the object query." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 656.43, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 665.33, "r_x1": 444.34, "r_y1": 665.33, "r_x2": 444.34, "r_y2": 656.43, "r_x3": 320.82, "r_y3": 656.43, "coord_origin": "TOPLEFT" }, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 447.01, "r_y0": 665.1, "r_x1": 545.11, "r_y1": 665.1, "r_x2": 545.11, "r_y2": 656.51, "r_x3": 447.01, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.29, "r_x1": 545.12, "r_y1": 677.29, "r_x2": 545.12, "r_y2": 668.38, "r_x3": 308.86, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 308.86, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "provide an attention weighted encoding. This weighted at-", "orig": "provide an attention weighted encoding. This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The encoding generated by the CNN Backbone Network along with the features acquired for every data cell from the Transformer Decoder are then passed to the attention network. The attention network takes both inputs and learns to provide an attention weighted encoding. This weighted at-" } ], "headers": [ { "label": "page_footer", "id": 9, "page_no": 4, "cluster": { "id": 9, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" } ] } }, { "page_no": 5, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 286.37, "r_y1": 96.07, "r_x2": 286.37, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.02, "r_x1": 286.37, "r_y1": 108.02, "r_x2": 286.37, "r_y2": 99.12, "r_x3": 50.11, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 119.98, "r_x1": 286.37, "r_y1": 119.98, "r_x2": 286.37, "r_y2": 111.07, "r_x3": 50.11, "r_y3": 111.07, "coord_origin": "TOPLEFT" }, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.93, "r_x1": 286.37, "r_y1": 131.93, "r_x2": 286.37, "r_y2": 123.03, "r_x3": 50.11, "r_y3": 123.03, "coord_origin": "TOPLEFT" }, "text": "of objects may exist. In our case, we know up front that", "orig": "of objects may exist. In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 143.89, "r_x1": 286.37, "r_y1": 143.89, "r_x2": 286.37, "r_y2": 134.98, "r_x3": 50.11, "r_y3": 134.98, "coord_origin": "TOPLEFT" }, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 155.85, "r_x1": 175.16, "r_y1": 155.85, "r_x2": 175.16, "r_y2": 146.94, "r_x3": 50.11, "r_y3": 146.94, "coord_origin": "TOPLEFT" }, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 168.53, "r_x1": 286.36, "r_y1": 168.53, "r_x2": 286.36, "r_y2": 159.62, "r_x3": 62.07, "r_y3": 159.62, "coord_origin": "TOPLEFT" }, "text": "The output features for each table cell are then fed", "orig": "The output features for each table cell are then fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 180.49, "r_x1": 286.37, "r_y1": 180.49, "r_x2": 286.37, "r_y2": 171.58, "r_x3": 50.11, "r_y3": 171.58, "coord_origin": "TOPLEFT" }, "text": "into the feed-forward network (FFN). The FFN consists", "orig": "into the feed-forward network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 192.44, "r_x1": 286.37, "r_y1": 192.44, "r_x2": 286.37, "r_y2": 183.54, "r_x3": 50.11, "r_y3": 183.54, "coord_origin": "TOPLEFT" }, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 204.4, "r_x1": 286.37, "r_y1": 204.4, "r_x2": 286.37, "r_y2": 195.49, "r_x3": 50.11, "r_y3": 195.49, "coord_origin": "TOPLEFT" }, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 216.35, "r_x1": 286.37, "r_y1": 216.35, "r_x2": 286.37, "r_y2": 207.45, "r_x3": 50.11, "r_y3": 207.45, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table cell. Finally, the predicted", "orig": "the bounding box of each table cell. Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 228.31, "r_x1": 286.37, "r_y1": 228.31, "r_x2": 286.37, "r_y2": 219.4, "r_x3": 50.11, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 240.26, "r_x1": 181.55, "r_y1": 240.26, "r_x2": 181.55, "r_y2": 231.36, "r_x3": 50.11, "r_y3": 231.36, "coord_origin": "TOPLEFT" }, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 252.88, "r_x1": 129.21, "r_y1": 252.88, "r_x2": 129.21, "r_y2": 243.92, "r_x3": 62.07, "r_y3": 243.92, "coord_origin": "TOPLEFT" }, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.45, "r_y0": 252.95, "r_x1": 286.36, "r_y1": 252.95, "r_x2": 286.36, "r_y2": 244.04, "r_x3": 134.45, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "We formulate a multi-task loss Eq. 2", "orig": "We formulate a multi-task loss Eq. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.9, "r_x1": 286.37, "r_y1": 264.9, "r_x2": 286.37, "r_y2": 256.0, "r_x3": 50.11, "r_y3": 256.0, "coord_origin": "TOPLEFT" }, "text": "to train our network. The Cross-Entropy loss (denoted as", "orig": "to train our network. The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.64, "r_x1": 56.85, "r_y1": 276.64, "r_x2": 56.85, "r_y2": 267.79, "r_x3": 50.11, "r_y3": 267.79, "coord_origin": "TOPLEFT" }, "text": "l$_{s}$", "orig": "l$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 57.34, "r_y0": 276.86, "r_x1": 135.4, "r_y1": 276.86, "r_x2": 135.4, "r_y2": 267.95, "r_x3": 57.34, "r_y3": 267.95, "coord_origin": "TOPLEFT" }, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.74, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04, "r_x3": 137.74, "r_y3": 268.04, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.64, "r_y0": 276.86, "r_x1": 286.36, "r_y1": 276.86, "r_x2": 286.36, "r_y2": 267.95, "r_x3": 213.64, "r_y3": 267.95, "coord_origin": "TOPLEFT" }, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.81, "r_x1": 158.82, "r_y1": 288.81, "r_x2": 158.82, "r_y2": 279.91, "r_x3": 50.11, "r_y3": 279.91, "coord_origin": "TOPLEFT" }, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.32, "r_y0": 288.58, "r_x1": 238.8, "r_y1": 288.58, "r_x2": 238.8, "r_y2": 280.0, "r_x3": 161.32, "r_y3": 280.0, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.52, "r_y0": 288.81, "r_x1": 286.36, "r_y1": 288.81, "r_x2": 286.36, "r_y2": 279.91, "r_x3": 241.52, "r_y3": 279.91, "coord_origin": "TOPLEFT" }, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.77, "r_x1": 211.38, "r_y1": 300.77, "r_x2": 211.38, "r_y2": 291.86, "r_x3": 50.11, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.27, "r_y0": 300.55, "r_x1": 229.2, "r_y1": 300.55, "r_x2": 229.2, "r_y2": 291.7, "r_x3": 214.27, "r_y3": 291.7, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.7, "r_y0": 300.77, "r_x1": 232.19, "r_y1": 300.77, "r_x2": 232.19, "r_y2": 291.86, "r_x3": 229.7, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.49, "r_y0": 300.55, "r_x1": 251.42, "r_y1": 300.55, "r_x2": 251.42, "r_y2": 291.7, "r_x3": 236.49, "r_y3": 291.7, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.81, "r_y0": 300.77, "r_x1": 286.36, "r_y1": 300.77, "r_x2": 286.36, "r_y2": 291.86, "r_x3": 254.81, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.72, "r_x1": 137.45, "r_y1": 312.72, "r_x2": 137.45, "r_y2": 303.82, "r_x3": 50.11, "r_y3": 303.82, "coord_origin": "TOPLEFT" }, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.3, "r_y0": 312.5, "r_x1": 148.24, "r_y1": 312.5, "r_x2": 148.24, "r_y2": 303.66, "r_x3": 141.3, "r_y3": 303.66, "coord_origin": "TOPLEFT" }, "text": "l$_{1}$", "orig": "l$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.59, "r_y0": 312.72, "r_x1": 286.36, "r_y1": 312.72, "r_x2": 286.36, "r_y2": 303.82, "r_x3": 152.59, "r_y3": 303.82, "coord_origin": "TOPLEFT" }, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.68, "r_x1": 89.68, "r_y1": 324.68, "r_x2": 89.68, "r_y2": 315.77, "r_x3": 50.11, "r_y3": 315.77, "coord_origin": "TOPLEFT" }, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.69, "r_y0": 324.46, "r_x1": 104.12, "r_y1": 324.46, "r_x2": 104.12, "r_y2": 315.61, "r_x3": 89.69, "r_y3": 315.61, "coord_origin": "TOPLEFT" }, "text": "l$_{iou}$", "orig": "l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.62, "r_y0": 324.68, "r_x1": 286.37, "r_y1": 324.68, "r_x2": 286.37, "r_y2": 315.77, "r_x3": 104.62, "r_y3": 315.77, "coord_origin": "TOPLEFT" }, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.64, "r_x1": 286.37, "r_y1": 336.64, "r_x2": 286.37, "r_y2": 327.73, "r_x3": 50.11, "r_y3": 327.73, "coord_origin": "TOPLEFT" }, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.59, "r_x1": 286.37, "r_y1": 348.59, "r_x2": 286.37, "r_y2": 339.68, "r_x3": 50.11, "r_y3": 339.68, "coord_origin": "TOPLEFT" }, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 360.54, "r_x1": 286.37, "r_y1": 360.54, "r_x2": 286.37, "r_y2": 351.64, "r_x3": 50.11, "r_y3": 351.64, "coord_origin": "TOPLEFT" }, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 372.5, "r_x1": 286.37, "r_y1": 372.5, "r_x2": 286.37, "r_y2": 363.59, "r_x3": 50.11, "r_y3": 363.59, "coord_origin": "TOPLEFT" }, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 384.45, "r_x1": 286.37, "r_y1": 384.45, "r_x2": 286.37, "r_y2": 375.55, "r_x3": 50.11, "r_y3": 375.55, "coord_origin": "TOPLEFT" }, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.41, "r_x1": 286.37, "r_y1": 396.41, "r_x2": 286.37, "r_y2": 387.5, "r_x3": 50.11, "r_y3": 387.5, "coord_origin": "TOPLEFT" }, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 408.37, "r_x1": 88.69, "r_y1": 408.37, "r_x2": 88.69, "r_y2": 399.46, "r_x3": 50.11, "r_y3": 399.46, "coord_origin": "TOPLEFT" }, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.65, "r_y0": 408.14, "r_x1": 170.05, "r_y1": 408.14, "r_x2": 170.05, "r_y2": 399.55, "r_x3": 91.65, "r_y3": 399.55, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.05, "r_y0": 408.37, "r_x1": 286.36, "r_y1": 408.37, "r_x2": 286.36, "r_y2": 399.46, "r_x3": 170.05, "r_y3": 399.46, "coord_origin": "TOPLEFT" }, "text": ", and 2) Our bounding boxes", "orig": ", and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 420.32, "r_x1": 181.97, "r_y1": 420.32, "r_x2": 181.97, "r_y2": 411.41, "r_x3": 50.11, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.09, "r_y0": 420.32, "r_x1": 197.75, "r_y1": 420.32, "r_x2": 197.75, "r_y2": 411.41, "r_x3": 189.09, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "3)", "orig": "3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.35, "r_y0": 420.32, "r_x1": 286.37, "r_y1": 420.32, "r_x2": 286.37, "r_y2": 411.41, "r_x3": 200.35, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "ensures a one-to-one", "orig": "ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 432.28, "r_x1": 286.37, "r_y1": 432.28, "r_x2": 286.37, "r_y2": 423.37, "r_x3": 50.11, "r_y3": 423.37, "coord_origin": "TOPLEFT" }, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 444.23, "r_x1": 158.3, "r_y1": 444.23, "r_x2": 158.3, "r_y2": 435.32, "r_x3": 50.11, "r_y3": 435.32, "coord_origin": "TOPLEFT" }, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 456.92, "r_x1": 286.36, "r_y1": 456.92, "r_x2": 286.36, "r_y2": 448.01, "r_x3": 62.07, "r_y3": 448.01, "coord_origin": "TOPLEFT" }, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 468.87, "r_x1": 91.38, "r_y1": 468.87, "r_x2": 91.38, "r_y2": 459.97, "r_x3": 50.11, "r_y3": 459.97, "coord_origin": "TOPLEFT" }, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.72, "r_y0": 502.13, "r_x1": 140.64, "r_y1": 502.13, "r_x2": 140.64, "r_y2": 493.28, "r_x3": 125.72, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.91, "r_y0": 502.13, "r_x1": 151.66, "r_y1": 502.13, "r_x2": 151.66, "r_y2": 493.28, "r_x3": 143.91, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.42, "r_y0": 502.13, "r_x1": 186.63, "r_y1": 502.13, "r_x2": 186.63, "r_y2": 493.28, "r_x3": 154.42, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$l$_{iou}$", "orig": "\u03bb$_{iou}$l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.34, "r_y0": 502.13, "r_x1": 197.09, "r_y1": 502.13, "r_x2": 197.09, "r_y2": 493.28, "r_x3": 189.34, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.3, "r_y0": 502.13, "r_x1": 211.65, "r_y1": 502.13, "r_x2": 211.65, "r_y2": 493.28, "r_x3": 199.3, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.33, "r_y0": 517.07, "r_x1": 127.3, "r_y1": 517.07, "r_x2": 127.3, "r_y2": 508.22, "r_x3": 124.33, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 130.27, "r_y0": 517.07, "r_x1": 138.01, "r_y1": 517.07, "r_x2": 138.01, "r_y2": 508.22, "r_x3": 130.27, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.78, "r_y0": 517.07, "r_x1": 153.33, "r_y1": 517.07, "r_x2": 153.33, "r_y2": 508.22, "r_x3": 140.78, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "\u03bbl$_{s}$", "orig": "\u03bbl$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.04, "r_y0": 517.07, "r_x1": 174.86, "r_y1": 517.07, "r_x2": 174.86, "r_y2": 508.22, "r_x3": 156.04, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "+ (1", "orig": "+ (1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 177.07, "r_y0": 517.07, "r_x1": 184.82, "r_y1": 517.07, "r_x2": 184.82, "r_y2": 507.67, "r_x3": 177.07, "r_y3": 507.67, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.03, "r_y0": 517.07, "r_x1": 192.84, "r_y1": 517.07, "r_x2": 192.84, "r_y2": 508.22, "r_x3": 187.03, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.85, "r_y0": 517.07, "r_x1": 196.72, "r_y1": 517.07, "r_x2": 196.72, "r_y2": 508.22, "r_x3": 192.85, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.72, "r_y0": 517.07, "r_x1": 211.65, "r_y1": 517.07, "r_x2": 211.65, "r_y2": 508.22, "r_x3": 196.72, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 509.92, "r_x1": 286.36, "r_y1": 509.92, "r_x2": 286.36, "r_y2": 501.01, "r_x3": 274.75, "r_y3": 501.01, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 540.22, "r_x1": 74.45, "r_y1": 540.22, "r_x2": 74.45, "r_y2": 531.31, "r_x3": 50.11, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.94, "r_y0": 540.0, "r_x1": 82.75, "r_y1": 540.0, "r_x2": 82.75, "r_y2": 531.15, "r_x3": 76.94, "r_y3": 531.15, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.52, "r_y0": 540.0, "r_x1": 92.16, "r_y1": 540.0, "r_x2": 92.16, "r_y2": 530.59, "r_x3": 85.52, "r_y3": 530.59, "coord_origin": "TOPLEFT" }, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.65, "r_y0": 540.22, "r_x1": 135.6, "r_y1": 540.22, "r_x2": 135.6, "r_y2": 531.31, "r_x3": 94.65, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.09, "r_y0": 540.0, "r_x1": 172.63, "r_y1": 540.0, "r_x2": 172.63, "r_y2": 531.15, "r_x3": 138.09, "r_y3": 531.15, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.9, "r_y0": 540.0, "r_x1": 192.5, "r_y1": 540.0, "r_x2": 192.5, "r_y2": 530.59, "r_x3": 175.9, "r_y3": 530.59, "coord_origin": "TOPLEFT" }, "text": "\u2208$_{R}$", "orig": "\u2208$_{R}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.99, "r_y0": 540.22, "r_x1": 281.6, "r_y1": 540.22, "r_x2": 281.6, "r_y2": 531.31, "r_x3": 194.99, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 566.66, "r_x1": 57.93, "r_y1": 566.66, "r_x2": 57.93, "r_y2": 555.92, "r_x3": 50.11, "r_y3": 555.92, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.35, "r_y0": 566.66, "r_x1": 171.98, "r_y1": 566.66, "r_x2": 171.98, "r_y2": 555.92, "r_x3": 68.35, "r_y3": 555.92, "coord_origin": "TOPLEFT" }, "text": "Experimental Results", "orig": "Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 586.12, "r_x1": 64.69, "r_y1": 586.12, "r_x2": 64.69, "r_y2": 576.26, "r_x3": 50.11, "r_y3": 576.26, "coord_origin": "TOPLEFT" }, "text": "5.1.", "orig": "5.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.41, "r_y0": 586.12, "r_x1": 179.18, "r_y1": 586.12, "r_x2": 179.18, "r_y2": 576.26, "r_x3": 74.41, "r_y3": 576.26, "coord_origin": "TOPLEFT" }, "text": "Implementation Details", "orig": "Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 604.64, "r_x1": 202.98, "r_y1": 604.64, "r_x2": 202.98, "r_y2": 595.73, "r_x3": 62.07, "r_y3": 595.73, "coord_origin": "TOPLEFT" }, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.38, "r_y0": 604.41, "r_x1": 286.36, "r_y1": 604.41, "r_x2": 286.36, "r_y2": 595.82, "r_x3": 205.38, "r_y3": 595.82, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 616.37, "r_x1": 70.04, "r_y1": 616.37, "r_x2": 70.04, "r_y2": 607.78, "r_x3": 50.11, "r_y3": 607.78, "coord_origin": "TOPLEFT" }, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 616.6, "r_x1": 286.36, "r_y1": 616.6, "r_x2": 286.36, "r_y2": 607.69, "r_x3": 70.04, "r_y3": 607.69, "coord_origin": "TOPLEFT" }, "text": ". The input images are resized to 448*448 pixels and", "orig": ". The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 628.55, "r_x1": 286.37, "r_y1": 628.55, "r_x2": 286.37, "r_y2": 619.64, "r_x3": 50.11, "r_y3": 619.64, "coord_origin": "TOPLEFT" }, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 640.51, "r_x1": 207.03, "r_y1": 640.51, "r_x2": 207.03, "r_y2": 631.6, "r_x3": 50.11, "r_y3": 631.6, "coord_origin": "TOPLEFT" }, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.66, "r_y0": 663.45, "r_x1": 186.02, "r_y1": 663.45, "r_x2": 186.02, "r_y2": 654.55, "r_x3": 91.66, "r_y3": 654.55, "coord_origin": "TOPLEFT" }, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.51, "r_y0": 663.23, "r_x1": 196.26, "r_y1": 663.23, "r_x2": 196.26, "r_y2": 653.83, "r_x3": 188.51, "r_y3": 653.83, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.75, "r_y0": 663.45, "r_x1": 244.81, "r_y1": 663.45, "r_x2": 244.81, "r_y2": 654.55, "r_x3": 198.75, "r_y3": 654.55, "coord_origin": "TOPLEFT" }, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.02, "r_y0": 678.4, "r_x1": 186.25, "r_y1": 678.4, "r_x2": 186.25, "r_y2": 669.49, "r_x3": 101.02, "r_y3": 669.49, "coord_origin": "TOPLEFT" }, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.74, "r_y0": 678.18, "r_x1": 196.48, "r_y1": 678.18, "r_x2": 196.48, "r_y2": 668.77, "r_x3": 188.74, "r_y3": 668.77, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.98, "r_y0": 678.4, "r_x1": 244.81, "r_y1": 678.4, "r_x2": 244.81, "r_y2": 669.49, "r_x3": 198.98, "r_y3": 669.49, "coord_origin": "TOPLEFT" }, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 671.02, "r_x1": 286.36, "r_y1": 671.02, "r_x2": 286.36, "r_y2": 662.12, "r_x3": 274.75, "r_y3": 662.12, "coord_origin": "TOPLEFT" }, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 545.12, "r_y1": 84.11, "r_x2": 545.12, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 339.99, "r_y1": 96.07, "r_x2": 339.99, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.89, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 346.89, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 492.96, "r_y1": 108.02, "r_x2": 492.96, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 125.14, "r_x1": 545.11, "r_y1": 125.14, "r_x2": 545.11, "r_y2": 116.23, "r_x3": 320.82, "r_y3": 116.23, "coord_origin": "TOPLEFT" }, "text": "The Transformer Encoder consists of two \u201cTransformer", "orig": "The Transformer Encoder consists of two \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 137.09, "r_x1": 545.12, "r_y1": 137.09, "r_x2": 545.12, "r_y2": 128.18, "r_x3": 308.86, "r_y3": 128.18, "coord_origin": "TOPLEFT" }, "text": "Encoder Layers\u201d, with an input feature size of 512, feed", "orig": "Encoder Layers\u201d, with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 149.05, "r_x1": 545.12, "r_y1": 149.05, "r_x2": 545.12, "r_y2": 140.14, "r_x3": 308.86, "r_y3": 140.14, "coord_origin": "TOPLEFT" }, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 161.0, "r_x1": 545.12, "r_y1": 161.0, "r_x2": 545.12, "r_y2": 152.09, "r_x3": 308.86, "r_y3": 152.09, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder it is composed of four \u201cTransformer", "orig": "Transformer Decoder it is composed of four \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 172.96, "r_x1": 545.12, "r_y1": 172.96, "r_x2": 545.12, "r_y2": 164.05, "r_x3": 308.86, "r_y3": 164.05, "coord_origin": "TOPLEFT" }, "text": "Decoder Layers\u201d with similar input and output dimensions", "orig": "Decoder Layers\u201d with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 184.91, "r_x1": 467.22, "r_y1": 184.91, "r_x2": 467.22, "r_y2": 176.01, "r_x3": 308.86, "r_y3": 176.01, "coord_origin": "TOPLEFT" }, "text": "as the \u201cTransformer Encoder Layers\u201d.", "orig": "as the \u201cTransformer Encoder Layers\u201d.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.44, "r_y0": 184.91, "r_x1": 545.12, "r_y1": 184.91, "r_x2": 545.12, "r_y2": 176.01, "r_x3": 475.44, "r_y3": 176.01, "coord_origin": "TOPLEFT" }, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 196.87, "r_x1": 545.12, "r_y1": 196.87, "r_x2": 545.12, "r_y2": 187.96, "r_x3": 308.86, "r_y3": 187.96, "coord_origin": "TOPLEFT" }, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 208.82, "r_x1": 545.12, "r_y1": 208.82, "r_x2": 545.12, "r_y2": 199.92, "r_x3": 308.86, "r_y3": 199.92, "coord_origin": "TOPLEFT" }, "text": "mentation parameters, our extensive experimentation has", "orig": "mentation parameters, our extensive experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 220.78, "r_x1": 545.12, "r_y1": 220.78, "r_x2": 545.12, "r_y2": 211.87, "r_x3": 308.86, "r_y3": 211.87, "coord_origin": "TOPLEFT" }, "text": "proved this setup to be more suitable for table images. We", "orig": "proved this setup to be more suitable for table images. We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 232.73, "r_x1": 545.12, "r_y1": 232.73, "r_x2": 545.12, "r_y2": 223.83, "r_x3": 308.86, "r_y3": 223.83, "coord_origin": "TOPLEFT" }, "text": "attribute this finding to the inherent design of table im-", "orig": "attribute this finding to the inherent design of table im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 244.69, "r_x1": 545.12, "r_y1": 244.69, "r_x2": 545.12, "r_y2": 235.78, "r_x3": 308.86, "r_y3": 235.78, "coord_origin": "TOPLEFT" }, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 256.64, "r_x1": 545.12, "r_y1": 256.64, "r_x2": 545.12, "r_y2": 247.74, "r_x3": 308.86, "r_y3": 247.74, "coord_origin": "TOPLEFT" }, "text": "elaborate content present in other scopes (e.g. the COCO", "orig": "elaborate content present in other scopes (e.g. the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 268.6, "r_x1": 342.34, "r_y1": 268.6, "r_x2": 342.34, "r_y2": 259.69, "r_x3": 308.86, "r_y3": 259.69, "coord_origin": "TOPLEFT" }, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.95, "r_y0": 268.6, "r_x1": 545.12, "r_y1": 268.6, "r_x2": 545.12, "r_y2": 259.69, "r_x3": 348.95, "r_y3": 259.69, "coord_origin": "TOPLEFT" }, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 280.55, "r_x1": 545.12, "r_y1": 280.55, "r_x2": 545.12, "r_y2": 271.65, "r_x3": 308.86, "r_y3": 271.65, "coord_origin": "TOPLEFT" }, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 292.51, "r_x1": 545.12, "r_y1": 292.51, "r_x2": 545.12, "r_y2": 283.6, "r_x3": 308.86, "r_y3": 283.6, "coord_origin": "TOPLEFT" }, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.46, "r_x1": 545.12, "r_y1": 304.46, "r_x2": 545.12, "r_y2": 295.56, "r_x3": 308.86, "r_y3": 295.56, "coord_origin": "TOPLEFT" }, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.42, "r_x1": 545.12, "r_y1": 316.42, "r_x2": 545.12, "r_y2": 307.51, "r_x3": 308.86, "r_y3": 307.51, "coord_origin": "TOPLEFT" }, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 328.37, "r_x1": 532.48, "r_y1": 328.37, "r_x2": 532.48, "r_y2": 319.47, "r_x3": 308.86, "r_y3": 319.47, "coord_origin": "TOPLEFT" }, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 345.48, "r_x1": 545.11, "r_y1": 345.48, "r_x2": 545.11, "r_y2": 336.58, "r_x3": 320.82, "r_y3": 336.58, "coord_origin": "TOPLEFT" }, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 357.44, "r_x1": 403.74, "r_y1": 357.44, "r_x2": 403.74, "r_y2": 348.53, "r_x3": 308.86, "r_y3": 348.53, "coord_origin": "TOPLEFT" }, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.08, "r_y0": 357.21, "r_x1": 503.54, "r_y1": 357.21, "r_x2": 503.54, "r_y2": 348.62, "r_x3": 406.08, "r_y3": 348.62, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 503.54, "r_y0": 357.44, "r_x1": 506.03, "r_y1": 357.44, "r_x2": 506.03, "r_y2": 348.53, "r_x3": 503.54, "r_y3": 348.53, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.4, "r_y0": 357.21, "r_x1": 545.11, "r_y1": 357.21, "r_x2": 545.11, "r_y2": 348.62, "r_x3": 508.4, "r_y3": 348.62, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 369.16, "r_x1": 343.16, "r_y1": 369.16, "r_x2": 343.16, "r_y2": 360.58, "r_x3": 308.86, "r_y3": 360.58, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.16, "r_y0": 369.39, "r_x1": 362.2, "r_y1": 369.39, "r_x2": 362.2, "r_y2": 360.49, "r_x3": 343.16, "r_y3": 360.49, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 364.29, "r_y0": 369.16, "r_x1": 440.94, "r_y1": 369.16, "r_x2": 440.94, "r_y2": 360.58, "r_x3": 364.29, "r_y3": 360.58, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.94, "r_y0": 369.39, "r_x1": 545.11, "r_y1": 369.39, "r_x2": 545.11, "r_y2": 360.49, "r_x3": 440.94, "r_y3": 360.49, "coord_origin": "TOPLEFT" }, "text": ". Taking the PubTabNet as", "orig": ". Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 381.35, "r_x1": 545.12, "r_y1": 381.35, "r_x2": 545.12, "r_y2": 372.44, "r_x3": 308.86, "r_y3": 372.44, "coord_origin": "TOPLEFT" }, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 393.31, "r_x1": 545.12, "r_y1": 393.31, "r_x2": 545.12, "r_y2": 384.4, "r_x3": 308.86, "r_y3": 384.4, "coord_origin": "TOPLEFT" }, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 405.04, "r_x1": 314.67, "r_y1": 405.04, "r_x2": 314.67, "r_y2": 396.19, "r_x3": 308.86, "r_y3": 396.19, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.66, "r_y0": 405.26, "r_x1": 360.39, "r_y1": 405.26, "r_x2": 360.39, "r_y2": 396.35, "r_x3": 318.66, "r_y3": 396.35, "coord_origin": "TOPLEFT" }, "text": "set to 0.5.", "orig": "set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.96, "r_y0": 405.26, "r_x1": 545.11, "r_y1": 405.26, "r_x2": 545.11, "r_y2": 396.35, "r_x3": 367.96, "r_y3": 396.35, "coord_origin": "TOPLEFT" }, "text": "Afterwards, we reduce the learning rate to", "orig": "Afterwards, we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 417.21, "r_x1": 545.12, "r_y1": 417.21, "r_x2": 545.12, "r_y2": 408.31, "r_x3": 308.86, "r_y3": 408.31, "coord_origin": "TOPLEFT" }, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 429.17, "r_x1": 360.97, "r_y1": 429.17, "r_x2": 360.97, "r_y2": 420.26, "r_x3": 308.86, "r_y3": 420.26, "coord_origin": "TOPLEFT" }, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 446.28, "r_x1": 545.11, "r_y1": 446.28, "r_x2": 545.11, "r_y2": 437.37, "r_x3": 320.82, "r_y3": 437.37, "coord_origin": "TOPLEFT" }, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 458.24, "r_x1": 384.63, "r_y1": 458.24, "r_x2": 384.63, "r_y2": 449.33, "r_x3": 308.86, "r_y3": 449.33, "coord_origin": "TOPLEFT" }, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 458.24, "r_x1": 545.12, "r_y1": 458.24, "r_x2": 545.12, "r_y2": 449.33, "r_x3": 391.37, "r_y3": 449.33, "coord_origin": "TOPLEFT" }, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 470.19, "r_x1": 494.01, "r_y1": 470.19, "r_x2": 494.01, "r_y2": 461.28, "r_x3": 308.86, "r_y3": 461.28, "coord_origin": "TOPLEFT" }, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.08, "r_y0": 469.96, "r_x1": 545.11, "r_y1": 469.96, "r_x2": 545.11, "r_y2": 461.37, "r_x3": 498.08, "r_y3": 461.37, "coord_origin": "TOPLEFT" }, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 481.92, "r_x1": 364.44, "r_y1": 481.92, "r_x2": 364.44, "r_y2": 473.33, "r_x3": 308.86, "r_y3": 473.33, "coord_origin": "TOPLEFT" }, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06, "r_y0": 482.15, "r_x1": 545.11, "r_y1": 482.15, "r_x2": 545.11, "r_y2": 473.24, "r_x3": 367.06, "r_y3": 473.24, "coord_origin": "TOPLEFT" }, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 494.1, "r_x1": 545.12, "r_y1": 494.1, "r_x2": 545.12, "r_y2": 485.19, "r_x3": 308.86, "r_y3": 485.19, "coord_origin": "TOPLEFT" }, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 506.06, "r_x1": 545.12, "r_y1": 506.06, "r_x2": 545.12, "r_y2": 497.15, "r_x3": 308.86, "r_y3": 497.15, "coord_origin": "TOPLEFT" }, "text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 518.01, "r_x1": 545.12, "r_y1": 518.01, "r_x2": 545.12, "r_y2": 509.11, "r_x3": 308.86, "r_y3": 509.11, "coord_origin": "TOPLEFT" }, "text": "faster autoregressive decoding. This is achieved by storing", "orig": "faster autoregressive decoding. This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 529.97, "r_x1": 545.12, "r_y1": 529.97, "r_x2": 545.12, "r_y2": 521.06, "r_x3": 308.86, "r_y3": 521.06, "coord_origin": "TOPLEFT" }, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 541.92, "r_x1": 545.12, "r_y1": 541.92, "r_x2": 545.12, "r_y2": 533.02, "r_x3": 308.86, "r_y3": 533.02, "coord_origin": "TOPLEFT" }, "text": "each time step. Therefore, we only compute the attention", "orig": "each time step. Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 553.88, "r_x1": 377.22, "r_y1": 553.88, "r_x2": 377.22, "r_y2": 544.97, "r_x3": 308.86, "r_y3": 544.97, "coord_origin": "TOPLEFT" }, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 589.41, "r_x1": 323.9, "r_y1": 589.41, "r_x2": 323.9, "r_y2": 579.55, "r_x3": 308.86, "r_y3": 579.55, "coord_origin": "TOPLEFT" }, "text": "5.2.", "orig": "5.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.93, "r_y0": 589.41, "r_x1": 397.44, "r_y1": 589.41, "r_x2": 397.44, "r_y2": 579.55, "r_x3": 333.93, "r_y3": 579.55, "coord_origin": "TOPLEFT" }, "text": "Generalization", "orig": "Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 612.36, "r_x1": 545.11, "r_y1": 612.36, "r_x2": 545.11, "r_y2": 603.45, "r_x3": 320.82, "r_y3": 603.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 624.31, "r_x1": 545.12, "r_y1": 624.31, "r_x2": 545.12, "r_y2": 615.4, "r_x3": 308.86, "r_y3": 615.4, "coord_origin": "TOPLEFT" }, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 636.27, "r_x1": 545.12, "r_y1": 636.27, "r_x2": 545.12, "r_y2": 627.36, "r_x3": 308.86, "r_y3": 627.36, "coord_origin": "TOPLEFT" }, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 648.22, "r_x1": 545.12, "r_y1": 648.22, "r_x2": 545.12, "r_y2": 639.31, "r_x3": 308.86, "r_y3": 639.31, "coord_origin": "TOPLEFT" }, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 660.18, "r_x1": 545.12, "r_y1": 660.18, "r_x2": 545.12, "r_y2": 651.27, "r_x3": 308.86, "r_y3": 651.27, "coord_origin": "TOPLEFT" }, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 672.13, "r_x1": 350.7, "r_y1": 672.13, "r_x2": 350.7, "r_y2": 663.23, "r_x3": 308.86, "r_y3": 663.23, "coord_origin": "TOPLEFT" }, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 320.82, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 396.21, "r_y1": 701.2, "r_x2": 396.21, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet dataset.", "orig": "SynthTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.41, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 406.41, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Throughout our experiments, the", "orig": "Throughout our experiments, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 495.94, "r_y1": 713.15, "r_x2": 495.94, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 155.85, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 286.37, "r_y1": 96.07, "r_x2": 286.37, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.02, "r_x1": 286.37, "r_y1": 108.02, "r_x2": 286.37, "r_y2": 99.12, "r_x3": 50.11, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 119.98, "r_x1": 286.37, "r_y1": 119.98, "r_x2": 286.37, "r_y2": 111.07, "r_x3": 50.11, "r_y3": 111.07, "coord_origin": "TOPLEFT" }, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.93, "r_x1": 286.37, "r_y1": 131.93, "r_x2": 286.37, "r_y2": 123.03, "r_x3": 50.11, "r_y3": 123.03, "coord_origin": "TOPLEFT" }, "text": "of objects may exist. In our case, we know up front that", "orig": "of objects may exist. In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 143.89, "r_x1": 286.37, "r_y1": 143.89, "r_x2": 286.37, "r_y2": 134.98, "r_x3": 50.11, "r_y3": 134.98, "coord_origin": "TOPLEFT" }, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 155.85, "r_x1": 175.16, "r_y1": 155.85, "r_x2": 175.16, "r_y2": 146.94, "r_x3": 50.11, "r_y3": 146.94, "coord_origin": "TOPLEFT" }, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 50.11, "t": 159.62, "r": 286.37, "b": 240.26, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 168.53, "r_x1": 286.36, "r_y1": 168.53, "r_x2": 286.36, "r_y2": 159.62, "r_x3": 62.07, "r_y3": 159.62, "coord_origin": "TOPLEFT" }, "text": "The output features for each table cell are then fed", "orig": "The output features for each table cell are then fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 180.49, "r_x1": 286.37, "r_y1": 180.49, "r_x2": 286.37, "r_y2": 171.58, "r_x3": 50.11, "r_y3": 171.58, "coord_origin": "TOPLEFT" }, "text": "into the feed-forward network (FFN). The FFN consists", "orig": "into the feed-forward network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 192.44, "r_x1": 286.37, "r_y1": 192.44, "r_x2": 286.37, "r_y2": 183.54, "r_x3": 50.11, "r_y3": 183.54, "coord_origin": "TOPLEFT" }, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 204.4, "r_x1": 286.37, "r_y1": 204.4, "r_x2": 286.37, "r_y2": 195.49, "r_x3": 50.11, "r_y3": 195.49, "coord_origin": "TOPLEFT" }, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 216.35, "r_x1": 286.37, "r_y1": 216.35, "r_x2": 286.37, "r_y2": 207.45, "r_x3": 50.11, "r_y3": 207.45, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table cell. Finally, the predicted", "orig": "the bounding box of each table cell. Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 228.31, "r_x1": 286.37, "r_y1": 228.31, "r_x2": 286.37, "r_y2": 219.4, "r_x3": 50.11, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 240.26, "r_x1": 181.55, "r_y1": 240.26, "r_x2": 181.55, "r_y2": 231.36, "r_x3": 50.11, "r_y3": 231.36, "coord_origin": "TOPLEFT" }, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 243.92, "r": 286.37, "b": 444.23, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 252.88, "r_x1": 129.21, "r_y1": 252.88, "r_x2": 129.21, "r_y2": 243.92, "r_x3": 62.07, "r_y3": 243.92, "coord_origin": "TOPLEFT" }, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.45, "r_y0": 252.95, "r_x1": 286.36, "r_y1": 252.95, "r_x2": 286.36, "r_y2": 244.04, "r_x3": 134.45, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "We formulate a multi-task loss Eq. 2", "orig": "We formulate a multi-task loss Eq. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.9, "r_x1": 286.37, "r_y1": 264.9, "r_x2": 286.37, "r_y2": 256.0, "r_x3": 50.11, "r_y3": 256.0, "coord_origin": "TOPLEFT" }, "text": "to train our network. The Cross-Entropy loss (denoted as", "orig": "to train our network. The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.64, "r_x1": 56.85, "r_y1": 276.64, "r_x2": 56.85, "r_y2": 267.79, "r_x3": 50.11, "r_y3": 267.79, "coord_origin": "TOPLEFT" }, "text": "l$_{s}$", "orig": "l$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 57.34, "r_y0": 276.86, "r_x1": 135.4, "r_y1": 276.86, "r_x2": 135.4, "r_y2": 267.95, "r_x3": 57.34, "r_y3": 267.95, "coord_origin": "TOPLEFT" }, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.74, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04, "r_x3": 137.74, "r_y3": 268.04, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.64, "r_y0": 276.86, "r_x1": 286.36, "r_y1": 276.86, "r_x2": 286.36, "r_y2": 267.95, "r_x3": 213.64, "r_y3": 267.95, "coord_origin": "TOPLEFT" }, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.81, "r_x1": 158.82, "r_y1": 288.81, "r_x2": 158.82, "r_y2": 279.91, "r_x3": 50.11, "r_y3": 279.91, "coord_origin": "TOPLEFT" }, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.32, "r_y0": 288.58, "r_x1": 238.8, "r_y1": 288.58, "r_x2": 238.8, "r_y2": 280.0, "r_x3": 161.32, "r_y3": 280.0, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.52, "r_y0": 288.81, "r_x1": 286.36, "r_y1": 288.81, "r_x2": 286.36, "r_y2": 279.91, "r_x3": 241.52, "r_y3": 279.91, "coord_origin": "TOPLEFT" }, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.77, "r_x1": 211.38, "r_y1": 300.77, "r_x2": 211.38, "r_y2": 291.86, "r_x3": 50.11, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.27, "r_y0": 300.55, "r_x1": 229.2, "r_y1": 300.55, "r_x2": 229.2, "r_y2": 291.7, "r_x3": 214.27, "r_y3": 291.7, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.7, "r_y0": 300.77, "r_x1": 232.19, "r_y1": 300.77, "r_x2": 232.19, "r_y2": 291.86, "r_x3": 229.7, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.49, "r_y0": 300.55, "r_x1": 251.42, "r_y1": 300.55, "r_x2": 251.42, "r_y2": 291.7, "r_x3": 236.49, "r_y3": 291.7, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.81, "r_y0": 300.77, "r_x1": 286.36, "r_y1": 300.77, "r_x2": 286.36, "r_y2": 291.86, "r_x3": 254.81, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.72, "r_x1": 137.45, "r_y1": 312.72, "r_x2": 137.45, "r_y2": 303.82, "r_x3": 50.11, "r_y3": 303.82, "coord_origin": "TOPLEFT" }, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.3, "r_y0": 312.5, "r_x1": 148.24, "r_y1": 312.5, "r_x2": 148.24, "r_y2": 303.66, "r_x3": 141.3, "r_y3": 303.66, "coord_origin": "TOPLEFT" }, "text": "l$_{1}$", "orig": "l$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.59, "r_y0": 312.72, "r_x1": 286.36, "r_y1": 312.72, "r_x2": 286.36, "r_y2": 303.82, "r_x3": 152.59, "r_y3": 303.82, "coord_origin": "TOPLEFT" }, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.68, "r_x1": 89.68, "r_y1": 324.68, "r_x2": 89.68, "r_y2": 315.77, "r_x3": 50.11, "r_y3": 315.77, "coord_origin": "TOPLEFT" }, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.69, "r_y0": 324.46, "r_x1": 104.12, "r_y1": 324.46, "r_x2": 104.12, "r_y2": 315.61, "r_x3": 89.69, "r_y3": 315.61, "coord_origin": "TOPLEFT" }, "text": "l$_{iou}$", "orig": "l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.62, "r_y0": 324.68, "r_x1": 286.37, "r_y1": 324.68, "r_x2": 286.37, "r_y2": 315.77, "r_x3": 104.62, "r_y3": 315.77, "coord_origin": "TOPLEFT" }, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.64, "r_x1": 286.37, "r_y1": 336.64, "r_x2": 286.37, "r_y2": 327.73, "r_x3": 50.11, "r_y3": 327.73, "coord_origin": "TOPLEFT" }, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.59, "r_x1": 286.37, "r_y1": 348.59, "r_x2": 286.37, "r_y2": 339.68, "r_x3": 50.11, "r_y3": 339.68, "coord_origin": "TOPLEFT" }, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 360.54, "r_x1": 286.37, "r_y1": 360.54, "r_x2": 286.37, "r_y2": 351.64, "r_x3": 50.11, "r_y3": 351.64, "coord_origin": "TOPLEFT" }, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 372.5, "r_x1": 286.37, "r_y1": 372.5, "r_x2": 286.37, "r_y2": 363.59, "r_x3": 50.11, "r_y3": 363.59, "coord_origin": "TOPLEFT" }, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 384.45, "r_x1": 286.37, "r_y1": 384.45, "r_x2": 286.37, "r_y2": 375.55, "r_x3": 50.11, "r_y3": 375.55, "coord_origin": "TOPLEFT" }, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.41, "r_x1": 286.37, "r_y1": 396.41, "r_x2": 286.37, "r_y2": 387.5, "r_x3": 50.11, "r_y3": 387.5, "coord_origin": "TOPLEFT" }, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 408.37, "r_x1": 88.69, "r_y1": 408.37, "r_x2": 88.69, "r_y2": 399.46, "r_x3": 50.11, "r_y3": 399.46, "coord_origin": "TOPLEFT" }, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.65, "r_y0": 408.14, "r_x1": 170.05, "r_y1": 408.14, "r_x2": 170.05, "r_y2": 399.55, "r_x3": 91.65, "r_y3": 399.55, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.05, "r_y0": 408.37, "r_x1": 286.36, "r_y1": 408.37, "r_x2": 286.36, "r_y2": 399.46, "r_x3": 170.05, "r_y3": 399.46, "coord_origin": "TOPLEFT" }, "text": ", and 2) Our bounding boxes", "orig": ", and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 420.32, "r_x1": 181.97, "r_y1": 420.32, "r_x2": 181.97, "r_y2": 411.41, "r_x3": 50.11, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.09, "r_y0": 420.32, "r_x1": 197.75, "r_y1": 420.32, "r_x2": 197.75, "r_y2": 411.41, "r_x3": 189.09, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "3)", "orig": "3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.35, "r_y0": 420.32, "r_x1": 286.37, "r_y1": 420.32, "r_x2": 286.37, "r_y2": 411.41, "r_x3": 200.35, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "ensures a one-to-one", "orig": "ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 432.28, "r_x1": 286.37, "r_y1": 432.28, "r_x2": 286.37, "r_y2": 423.37, "r_x3": 50.11, "r_y3": 423.37, "coord_origin": "TOPLEFT" }, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 444.23, "r_x1": 158.3, "r_y1": 444.23, "r_x2": 158.3, "r_y2": 435.32, "r_x3": 50.11, "r_y3": 435.32, "coord_origin": "TOPLEFT" }, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 448.01, "r": 286.36, "b": 468.87, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 456.92, "r_x1": 286.36, "r_y1": 456.92, "r_x2": 286.36, "r_y2": 448.01, "r_x3": 62.07, "r_y3": 448.01, "coord_origin": "TOPLEFT" }, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 468.87, "r_x1": 91.38, "r_y1": 468.87, "r_x2": 91.38, "r_y2": 459.97, "r_x3": 50.11, "r_y3": 459.97, "coord_origin": "TOPLEFT" }, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "formula", "bbox": { "l": 124.33, "t": 493.28, "r": 286.36, "b": 517.07, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.72, "r_y0": 502.13, "r_x1": 140.64, "r_y1": 502.13, "r_x2": 140.64, "r_y2": 493.28, "r_x3": 125.72, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.91, "r_y0": 502.13, "r_x1": 151.66, "r_y1": 502.13, "r_x2": 151.66, "r_y2": 493.28, "r_x3": 143.91, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.42, "r_y0": 502.13, "r_x1": 186.63, "r_y1": 502.13, "r_x2": 186.63, "r_y2": 493.28, "r_x3": 154.42, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$l$_{iou}$", "orig": "\u03bb$_{iou}$l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.34, "r_y0": 502.13, "r_x1": 197.09, "r_y1": 502.13, "r_x2": 197.09, "r_y2": 493.28, "r_x3": 189.34, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.3, "r_y0": 502.13, "r_x1": 211.65, "r_y1": 502.13, "r_x2": 211.65, "r_y2": 493.28, "r_x3": 199.3, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.33, "r_y0": 517.07, "r_x1": 127.3, "r_y1": 517.07, "r_x2": 127.3, "r_y2": 508.22, "r_x3": 124.33, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 130.27, "r_y0": 517.07, "r_x1": 138.01, "r_y1": 517.07, "r_x2": 138.01, "r_y2": 508.22, "r_x3": 130.27, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.78, "r_y0": 517.07, "r_x1": 153.33, "r_y1": 517.07, "r_x2": 153.33, "r_y2": 508.22, "r_x3": 140.78, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "\u03bbl$_{s}$", "orig": "\u03bbl$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.04, "r_y0": 517.07, "r_x1": 174.86, "r_y1": 517.07, "r_x2": 174.86, "r_y2": 508.22, "r_x3": 156.04, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "+ (1", "orig": "+ (1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 177.07, "r_y0": 517.07, "r_x1": 184.82, "r_y1": 517.07, "r_x2": 184.82, "r_y2": 507.67, "r_x3": 177.07, "r_y3": 507.67, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.03, "r_y0": 517.07, "r_x1": 192.84, "r_y1": 517.07, "r_x2": 192.84, "r_y2": 508.22, "r_x3": 187.03, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.85, "r_y0": 517.07, "r_x1": 196.72, "r_y1": 517.07, "r_x2": 196.72, "r_y2": 508.22, "r_x3": 192.85, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.72, "r_y0": 517.07, "r_x1": 211.65, "r_y1": 517.07, "r_x2": 211.65, "r_y2": 508.22, "r_x3": 196.72, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 509.92, "r_x1": 286.36, "r_y1": 509.92, "r_x2": 286.36, "r_y2": 501.01, "r_x3": 274.75, "r_y3": 501.01, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 50.11, "t": 530.59, "r": 281.6, "b": 540.22, "coord_origin": "TOPLEFT" }, "confidence": 0.936, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 540.22, "r_x1": 74.45, "r_y1": 540.22, "r_x2": 74.45, "r_y2": 531.31, "r_x3": 50.11, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.94, "r_y0": 540.0, "r_x1": 82.75, "r_y1": 540.0, "r_x2": 82.75, "r_y2": 531.15, "r_x3": 76.94, "r_y3": 531.15, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.52, "r_y0": 540.0, "r_x1": 92.16, "r_y1": 540.0, "r_x2": 92.16, "r_y2": 530.59, "r_x3": 85.52, "r_y3": 530.59, "coord_origin": "TOPLEFT" }, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.65, "r_y0": 540.22, "r_x1": 135.6, "r_y1": 540.22, "r_x2": 135.6, "r_y2": 531.31, "r_x3": 94.65, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.09, "r_y0": 540.0, "r_x1": 172.63, "r_y1": 540.0, "r_x2": 172.63, "r_y2": 531.15, "r_x3": 138.09, "r_y3": 531.15, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.9, "r_y0": 540.0, "r_x1": 192.5, "r_y1": 540.0, "r_x2": 192.5, "r_y2": 530.59, "r_x3": 175.9, "r_y3": 530.59, "coord_origin": "TOPLEFT" }, "text": "\u2208$_{R}$", "orig": "\u2208$_{R}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.99, "r_y0": 540.22, "r_x1": 281.6, "r_y1": 540.22, "r_x2": 281.6, "r_y2": 531.31, "r_x3": 194.99, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "section_header", "bbox": { "l": 50.11, "t": 555.92, "r": 171.98, "b": 566.66, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 566.66, "r_x1": 57.93, "r_y1": 566.66, "r_x2": 57.93, "r_y2": 555.92, "r_x3": 50.11, "r_y3": 555.92, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.35, "r_y0": 566.66, "r_x1": 171.98, "r_y1": 566.66, "r_x2": 171.98, "r_y2": 555.92, "r_x3": 68.35, "r_y3": 555.92, "coord_origin": "TOPLEFT" }, "text": "Experimental Results", "orig": "Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "section_header", "bbox": { "l": 50.11, "t": 576.26, "r": 179.18, "b": 586.12, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 586.12, "r_x1": 64.69, "r_y1": 586.12, "r_x2": 64.69, "r_y2": 576.26, "r_x3": 50.11, "r_y3": 576.26, "coord_origin": "TOPLEFT" }, "text": "5.1.", "orig": "5.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.41, "r_y0": 586.12, "r_x1": 179.18, "r_y1": 586.12, "r_x2": 179.18, "r_y2": 576.26, "r_x3": 74.41, "r_y3": 576.26, "coord_origin": "TOPLEFT" }, "text": "Implementation Details", "orig": "Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 595.73, "r": 286.37, "b": 640.51, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 604.64, "r_x1": 202.98, "r_y1": 604.64, "r_x2": 202.98, "r_y2": 595.73, "r_x3": 62.07, "r_y3": 595.73, "coord_origin": "TOPLEFT" }, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.38, "r_y0": 604.41, "r_x1": 286.36, "r_y1": 604.41, "r_x2": 286.36, "r_y2": 595.82, "r_x3": 205.38, "r_y3": 595.82, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 616.37, "r_x1": 70.04, "r_y1": 616.37, "r_x2": 70.04, "r_y2": 607.78, "r_x3": 50.11, "r_y3": 607.78, "coord_origin": "TOPLEFT" }, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 616.6, "r_x1": 286.36, "r_y1": 616.6, "r_x2": 286.36, "r_y2": 607.69, "r_x3": 70.04, "r_y3": 607.69, "coord_origin": "TOPLEFT" }, "text": ". The input images are resized to 448*448 pixels and", "orig": ". The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 628.55, "r_x1": 286.37, "r_y1": 628.55, "r_x2": 286.37, "r_y2": 619.64, "r_x3": 50.11, "r_y3": 619.64, "coord_origin": "TOPLEFT" }, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 640.51, "r_x1": 207.03, "r_y1": 640.51, "r_x2": 207.03, "r_y2": 631.6, "r_x3": 50.11, "r_y3": 631.6, "coord_origin": "TOPLEFT" }, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "formula", "bbox": { "l": 91.66, "t": 653.83, "r": 286.36, "b": 678.4, "coord_origin": "TOPLEFT" }, "confidence": 0.844, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.66, "r_y0": 663.45, "r_x1": 186.02, "r_y1": 663.45, "r_x2": 186.02, "r_y2": 654.55, "r_x3": 91.66, "r_y3": 654.55, "coord_origin": "TOPLEFT" }, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.51, "r_y0": 663.23, "r_x1": 196.26, "r_y1": 663.23, "r_x2": 196.26, "r_y2": 653.83, "r_x3": 188.51, "r_y3": 653.83, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.75, "r_y0": 663.45, "r_x1": 244.81, "r_y1": 663.45, "r_x2": 244.81, "r_y2": 654.55, "r_x3": 198.75, "r_y3": 654.55, "coord_origin": "TOPLEFT" }, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.02, "r_y0": 678.4, "r_x1": 186.25, "r_y1": 678.4, "r_x2": 186.25, "r_y2": 669.49, "r_x3": 101.02, "r_y3": 669.49, "coord_origin": "TOPLEFT" }, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.74, "r_y0": 678.18, "r_x1": 196.48, "r_y1": 678.18, "r_x2": 196.48, "r_y2": 668.77, "r_x3": 188.74, "r_y3": 668.77, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.98, "r_y0": 678.4, "r_x1": 244.81, "r_y1": 678.4, "r_x2": 244.81, "r_y2": 669.49, "r_x3": 198.98, "r_y3": 669.49, "coord_origin": "TOPLEFT" }, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 671.02, "r_x1": 286.36, "r_y1": 671.02, "r_x2": 286.36, "r_y2": 662.12, "r_x3": 274.75, "r_y3": 662.12, "coord_origin": "TOPLEFT" }, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 692.29, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 545.12, "r_y1": 84.11, "r_x2": 545.12, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 339.99, "r_y1": 96.07, "r_x2": 339.99, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.89, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 346.89, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 492.96, "r_y1": 108.02, "r_x2": 492.96, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 116.23, "r": 545.12, "b": 328.37, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 125.14, "r_x1": 545.11, "r_y1": 125.14, "r_x2": 545.11, "r_y2": 116.23, "r_x3": 320.82, "r_y3": 116.23, "coord_origin": "TOPLEFT" }, "text": "The Transformer Encoder consists of two \u201cTransformer", "orig": "The Transformer Encoder consists of two \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 137.09, "r_x1": 545.12, "r_y1": 137.09, "r_x2": 545.12, "r_y2": 128.18, "r_x3": 308.86, "r_y3": 128.18, "coord_origin": "TOPLEFT" }, "text": "Encoder Layers\u201d, with an input feature size of 512, feed", "orig": "Encoder Layers\u201d, with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 149.05, "r_x1": 545.12, "r_y1": 149.05, "r_x2": 545.12, "r_y2": 140.14, "r_x3": 308.86, "r_y3": 140.14, "coord_origin": "TOPLEFT" }, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 161.0, "r_x1": 545.12, "r_y1": 161.0, "r_x2": 545.12, "r_y2": 152.09, "r_x3": 308.86, "r_y3": 152.09, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder it is composed of four \u201cTransformer", "orig": "Transformer Decoder it is composed of four \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 172.96, "r_x1": 545.12, "r_y1": 172.96, "r_x2": 545.12, "r_y2": 164.05, "r_x3": 308.86, "r_y3": 164.05, "coord_origin": "TOPLEFT" }, "text": "Decoder Layers\u201d with similar input and output dimensions", "orig": "Decoder Layers\u201d with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 184.91, "r_x1": 467.22, "r_y1": 184.91, "r_x2": 467.22, "r_y2": 176.01, "r_x3": 308.86, "r_y3": 176.01, "coord_origin": "TOPLEFT" }, "text": "as the \u201cTransformer Encoder Layers\u201d.", "orig": "as the \u201cTransformer Encoder Layers\u201d.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.44, "r_y0": 184.91, "r_x1": 545.12, "r_y1": 184.91, "r_x2": 545.12, "r_y2": 176.01, "r_x3": 475.44, "r_y3": 176.01, "coord_origin": "TOPLEFT" }, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 196.87, "r_x1": 545.12, "r_y1": 196.87, "r_x2": 545.12, "r_y2": 187.96, "r_x3": 308.86, "r_y3": 187.96, "coord_origin": "TOPLEFT" }, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 208.82, "r_x1": 545.12, "r_y1": 208.82, "r_x2": 545.12, "r_y2": 199.92, "r_x3": 308.86, "r_y3": 199.92, "coord_origin": "TOPLEFT" }, "text": "mentation parameters, our extensive experimentation has", "orig": "mentation parameters, our extensive experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 220.78, "r_x1": 545.12, "r_y1": 220.78, "r_x2": 545.12, "r_y2": 211.87, "r_x3": 308.86, "r_y3": 211.87, "coord_origin": "TOPLEFT" }, "text": "proved this setup to be more suitable for table images. We", "orig": "proved this setup to be more suitable for table images. We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 232.73, "r_x1": 545.12, "r_y1": 232.73, "r_x2": 545.12, "r_y2": 223.83, "r_x3": 308.86, "r_y3": 223.83, "coord_origin": "TOPLEFT" }, "text": "attribute this finding to the inherent design of table im-", "orig": "attribute this finding to the inherent design of table im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 244.69, "r_x1": 545.12, "r_y1": 244.69, "r_x2": 545.12, "r_y2": 235.78, "r_x3": 308.86, "r_y3": 235.78, "coord_origin": "TOPLEFT" }, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 256.64, "r_x1": 545.12, "r_y1": 256.64, "r_x2": 545.12, "r_y2": 247.74, "r_x3": 308.86, "r_y3": 247.74, "coord_origin": "TOPLEFT" }, "text": "elaborate content present in other scopes (e.g. the COCO", "orig": "elaborate content present in other scopes (e.g. the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 268.6, "r_x1": 342.34, "r_y1": 268.6, "r_x2": 342.34, "r_y2": 259.69, "r_x3": 308.86, "r_y3": 259.69, "coord_origin": "TOPLEFT" }, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.95, "r_y0": 268.6, "r_x1": 545.12, "r_y1": 268.6, "r_x2": 545.12, "r_y2": 259.69, "r_x3": 348.95, "r_y3": 259.69, "coord_origin": "TOPLEFT" }, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 280.55, "r_x1": 545.12, "r_y1": 280.55, "r_x2": 545.12, "r_y2": 271.65, "r_x3": 308.86, "r_y3": 271.65, "coord_origin": "TOPLEFT" }, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 292.51, "r_x1": 545.12, "r_y1": 292.51, "r_x2": 545.12, "r_y2": 283.6, "r_x3": 308.86, "r_y3": 283.6, "coord_origin": "TOPLEFT" }, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.46, "r_x1": 545.12, "r_y1": 304.46, "r_x2": 545.12, "r_y2": 295.56, "r_x3": 308.86, "r_y3": 295.56, "coord_origin": "TOPLEFT" }, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.42, "r_x1": 545.12, "r_y1": 316.42, "r_x2": 545.12, "r_y2": 307.51, "r_x3": 308.86, "r_y3": 307.51, "coord_origin": "TOPLEFT" }, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 328.37, "r_x1": 532.48, "r_y1": 328.37, "r_x2": 532.48, "r_y2": 319.47, "r_x3": 308.86, "r_y3": 319.47, "coord_origin": "TOPLEFT" }, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 336.58, "r": 545.12, "b": 429.17, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 345.48, "r_x1": 545.11, "r_y1": 345.48, "r_x2": 545.11, "r_y2": 336.58, "r_x3": 320.82, "r_y3": 336.58, "coord_origin": "TOPLEFT" }, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 357.44, "r_x1": 403.74, "r_y1": 357.44, "r_x2": 403.74, "r_y2": 348.53, "r_x3": 308.86, "r_y3": 348.53, "coord_origin": "TOPLEFT" }, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.08, "r_y0": 357.21, "r_x1": 503.54, "r_y1": 357.21, "r_x2": 503.54, "r_y2": 348.62, "r_x3": 406.08, "r_y3": 348.62, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 503.54, "r_y0": 357.44, "r_x1": 506.03, "r_y1": 357.44, "r_x2": 506.03, "r_y2": 348.53, "r_x3": 503.54, "r_y3": 348.53, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.4, "r_y0": 357.21, "r_x1": 545.11, "r_y1": 357.21, "r_x2": 545.11, "r_y2": 348.62, "r_x3": 508.4, "r_y3": 348.62, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 369.16, "r_x1": 343.16, "r_y1": 369.16, "r_x2": 343.16, "r_y2": 360.58, "r_x3": 308.86, "r_y3": 360.58, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.16, "r_y0": 369.39, "r_x1": 362.2, "r_y1": 369.39, "r_x2": 362.2, "r_y2": 360.49, "r_x3": 343.16, "r_y3": 360.49, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 364.29, "r_y0": 369.16, "r_x1": 440.94, "r_y1": 369.16, "r_x2": 440.94, "r_y2": 360.58, "r_x3": 364.29, "r_y3": 360.58, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.94, "r_y0": 369.39, "r_x1": 545.11, "r_y1": 369.39, "r_x2": 545.11, "r_y2": 360.49, "r_x3": 440.94, "r_y3": 360.49, "coord_origin": "TOPLEFT" }, "text": ". Taking the PubTabNet as", "orig": ". Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 381.35, "r_x1": 545.12, "r_y1": 381.35, "r_x2": 545.12, "r_y2": 372.44, "r_x3": 308.86, "r_y3": 372.44, "coord_origin": "TOPLEFT" }, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 393.31, "r_x1": 545.12, "r_y1": 393.31, "r_x2": 545.12, "r_y2": 384.4, "r_x3": 308.86, "r_y3": 384.4, "coord_origin": "TOPLEFT" }, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 405.04, "r_x1": 314.67, "r_y1": 405.04, "r_x2": 314.67, "r_y2": 396.19, "r_x3": 308.86, "r_y3": 396.19, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.66, "r_y0": 405.26, "r_x1": 360.39, "r_y1": 405.26, "r_x2": 360.39, "r_y2": 396.35, "r_x3": 318.66, "r_y3": 396.35, "coord_origin": "TOPLEFT" }, "text": "set to 0.5.", "orig": "set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.96, "r_y0": 405.26, "r_x1": 545.11, "r_y1": 405.26, "r_x2": 545.11, "r_y2": 396.35, "r_x3": 367.96, "r_y3": 396.35, "coord_origin": "TOPLEFT" }, "text": "Afterwards, we reduce the learning rate to", "orig": "Afterwards, we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 417.21, "r_x1": 545.12, "r_y1": 417.21, "r_x2": 545.12, "r_y2": 408.31, "r_x3": 308.86, "r_y3": 408.31, "coord_origin": "TOPLEFT" }, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 429.17, "r_x1": 360.97, "r_y1": 429.17, "r_x2": 360.97, "r_y2": 420.26, "r_x3": 308.86, "r_y3": 420.26, "coord_origin": "TOPLEFT" }, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 437.37, "r": 545.12, "b": 553.88, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 446.28, "r_x1": 545.11, "r_y1": 446.28, "r_x2": 545.11, "r_y2": 437.37, "r_x3": 320.82, "r_y3": 437.37, "coord_origin": "TOPLEFT" }, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 458.24, "r_x1": 384.63, "r_y1": 458.24, "r_x2": 384.63, "r_y2": 449.33, "r_x3": 308.86, "r_y3": 449.33, "coord_origin": "TOPLEFT" }, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 458.24, "r_x1": 545.12, "r_y1": 458.24, "r_x2": 545.12, "r_y2": 449.33, "r_x3": 391.37, "r_y3": 449.33, "coord_origin": "TOPLEFT" }, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 470.19, "r_x1": 494.01, "r_y1": 470.19, "r_x2": 494.01, "r_y2": 461.28, "r_x3": 308.86, "r_y3": 461.28, "coord_origin": "TOPLEFT" }, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.08, "r_y0": 469.96, "r_x1": 545.11, "r_y1": 469.96, "r_x2": 545.11, "r_y2": 461.37, "r_x3": 498.08, "r_y3": 461.37, "coord_origin": "TOPLEFT" }, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 481.92, "r_x1": 364.44, "r_y1": 481.92, "r_x2": 364.44, "r_y2": 473.33, "r_x3": 308.86, "r_y3": 473.33, "coord_origin": "TOPLEFT" }, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06, "r_y0": 482.15, "r_x1": 545.11, "r_y1": 482.15, "r_x2": 545.11, "r_y2": 473.24, "r_x3": 367.06, "r_y3": 473.24, "coord_origin": "TOPLEFT" }, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 494.1, "r_x1": 545.12, "r_y1": 494.1, "r_x2": 545.12, "r_y2": 485.19, "r_x3": 308.86, "r_y3": 485.19, "coord_origin": "TOPLEFT" }, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 506.06, "r_x1": 545.12, "r_y1": 506.06, "r_x2": 545.12, "r_y2": 497.15, "r_x3": 308.86, "r_y3": 497.15, "coord_origin": "TOPLEFT" }, "text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 518.01, "r_x1": 545.12, "r_y1": 518.01, "r_x2": 545.12, "r_y2": 509.11, "r_x3": 308.86, "r_y3": 509.11, "coord_origin": "TOPLEFT" }, "text": "faster autoregressive decoding. This is achieved by storing", "orig": "faster autoregressive decoding. This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 529.97, "r_x1": 545.12, "r_y1": 529.97, "r_x2": 545.12, "r_y2": 521.06, "r_x3": 308.86, "r_y3": 521.06, "coord_origin": "TOPLEFT" }, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 541.92, "r_x1": 545.12, "r_y1": 541.92, "r_x2": 545.12, "r_y2": 533.02, "r_x3": 308.86, "r_y3": 533.02, "coord_origin": "TOPLEFT" }, "text": "each time step. Therefore, we only compute the attention", "orig": "each time step. Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 553.88, "r_x1": 377.22, "r_y1": 553.88, "r_x2": 377.22, "r_y2": 544.97, "r_x3": 308.86, "r_y3": 544.97, "coord_origin": "TOPLEFT" }, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "section_header", "bbox": { "l": 308.86, "t": 579.55, "r": 397.44, "b": 589.41, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 589.41, "r_x1": 323.9, "r_y1": 589.41, "r_x2": 323.9, "r_y2": 579.55, "r_x3": 308.86, "r_y3": 579.55, "coord_origin": "TOPLEFT" }, "text": "5.2.", "orig": "5.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.93, "r_y0": 589.41, "r_x1": 397.44, "r_y1": 589.41, "r_x2": 397.44, "r_y2": 579.55, "r_x3": 333.93, "r_y3": 579.55, "coord_origin": "TOPLEFT" }, "text": "Generalization", "orig": "Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 603.45, "r": 545.12, "b": 672.13, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 612.36, "r_x1": 545.11, "r_y1": 612.36, "r_x2": 545.11, "r_y2": 603.45, "r_x3": 320.82, "r_y3": 603.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 624.31, "r_x1": 545.12, "r_y1": 624.31, "r_x2": 545.12, "r_y2": 615.4, "r_x3": 308.86, "r_y3": 615.4, "coord_origin": "TOPLEFT" }, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 636.27, "r_x1": 545.12, "r_y1": 636.27, "r_x2": 545.12, "r_y2": 627.36, "r_x3": 308.86, "r_y3": 627.36, "coord_origin": "TOPLEFT" }, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 648.22, "r_x1": 545.12, "r_y1": 648.22, "r_x2": 545.12, "r_y2": 639.31, "r_x3": 308.86, "r_y3": 639.31, "coord_origin": "TOPLEFT" }, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 660.18, "r_x1": 545.12, "r_y1": 660.18, "r_x2": 545.12, "r_y2": 651.27, "r_x3": 308.86, "r_y3": 651.27, "coord_origin": "TOPLEFT" }, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 672.13, "r_x1": 350.7, "r_y1": 672.13, "r_x2": 350.7, "r_y2": 663.23, "r_x3": 308.86, "r_y3": 663.23, "coord_origin": "TOPLEFT" }, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 308.86, "t": 680.34, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 320.82, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 396.21, "r_y1": 701.2, "r_x2": 396.21, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet dataset.", "orig": "SynthTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.41, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 406.41, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Throughout our experiments, the", "orig": "Throughout our experiments, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 495.94, "r_y1": 713.15, "r_x2": 495.94, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 155.85, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 286.37, "r_y1": 96.07, "r_x2": 286.37, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.02, "r_x1": 286.37, "r_y1": 108.02, "r_x2": 286.37, "r_y2": 99.12, "r_x3": 50.11, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 119.98, "r_x1": 286.37, "r_y1": 119.98, "r_x2": 286.37, "r_y2": 111.07, "r_x3": 50.11, "r_y3": 111.07, "coord_origin": "TOPLEFT" }, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.93, "r_x1": 286.37, "r_y1": 131.93, "r_x2": 286.37, "r_y2": 123.03, "r_x3": 50.11, "r_y3": 123.03, "coord_origin": "TOPLEFT" }, "text": "of objects may exist. In our case, we know up front that", "orig": "of objects may exist. In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 143.89, "r_x1": 286.37, "r_y1": 143.89, "r_x2": 286.37, "r_y2": 134.98, "r_x3": 50.11, "r_y3": 134.98, "coord_origin": "TOPLEFT" }, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 155.85, "r_x1": 175.16, "r_y1": 155.85, "r_x2": 175.16, "r_y2": 146.94, "r_x3": 50.11, "r_y3": 146.94, "coord_origin": "TOPLEFT" }, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 50.11, "t": 159.62, "r": 286.37, "b": 240.26, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 168.53, "r_x1": 286.36, "r_y1": 168.53, "r_x2": 286.36, "r_y2": 159.62, "r_x3": 62.07, "r_y3": 159.62, "coord_origin": "TOPLEFT" }, "text": "The output features for each table cell are then fed", "orig": "The output features for each table cell are then fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 180.49, "r_x1": 286.37, "r_y1": 180.49, "r_x2": 286.37, "r_y2": 171.58, "r_x3": 50.11, "r_y3": 171.58, "coord_origin": "TOPLEFT" }, "text": "into the feed-forward network (FFN). The FFN consists", "orig": "into the feed-forward network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 192.44, "r_x1": 286.37, "r_y1": 192.44, "r_x2": 286.37, "r_y2": 183.54, "r_x3": 50.11, "r_y3": 183.54, "coord_origin": "TOPLEFT" }, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 204.4, "r_x1": 286.37, "r_y1": 204.4, "r_x2": 286.37, "r_y2": 195.49, "r_x3": 50.11, "r_y3": 195.49, "coord_origin": "TOPLEFT" }, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 216.35, "r_x1": 286.37, "r_y1": 216.35, "r_x2": 286.37, "r_y2": 207.45, "r_x3": 50.11, "r_y3": 207.45, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table cell. Finally, the predicted", "orig": "the bounding box of each table cell. Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 228.31, "r_x1": 286.37, "r_y1": 228.31, "r_x2": 286.37, "r_y2": 219.4, "r_x3": 50.11, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 240.26, "r_x1": 181.55, "r_y1": 240.26, "r_x2": 181.55, "r_y2": 231.36, "r_x3": 50.11, "r_y3": 231.36, "coord_origin": "TOPLEFT" }, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer." }, { "label": "text", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 243.92, "r": 286.37, "b": 444.23, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 252.88, "r_x1": 129.21, "r_y1": 252.88, "r_x2": 129.21, "r_y2": 243.92, "r_x3": 62.07, "r_y3": 243.92, "coord_origin": "TOPLEFT" }, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.45, "r_y0": 252.95, "r_x1": 286.36, "r_y1": 252.95, "r_x2": 286.36, "r_y2": 244.04, "r_x3": 134.45, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "We formulate a multi-task loss Eq. 2", "orig": "We formulate a multi-task loss Eq. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.9, "r_x1": 286.37, "r_y1": 264.9, "r_x2": 286.37, "r_y2": 256.0, "r_x3": 50.11, "r_y3": 256.0, "coord_origin": "TOPLEFT" }, "text": "to train our network. The Cross-Entropy loss (denoted as", "orig": "to train our network. The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.64, "r_x1": 56.85, "r_y1": 276.64, "r_x2": 56.85, "r_y2": 267.79, "r_x3": 50.11, "r_y3": 267.79, "coord_origin": "TOPLEFT" }, "text": "l$_{s}$", "orig": "l$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 57.34, "r_y0": 276.86, "r_x1": 135.4, "r_y1": 276.86, "r_x2": 135.4, "r_y2": 267.95, "r_x3": 57.34, "r_y3": 267.95, "coord_origin": "TOPLEFT" }, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.74, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04, "r_x3": 137.74, "r_y3": 268.04, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.64, "r_y0": 276.86, "r_x1": 286.36, "r_y1": 276.86, "r_x2": 286.36, "r_y2": 267.95, "r_x3": 213.64, "r_y3": 267.95, "coord_origin": "TOPLEFT" }, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.81, "r_x1": 158.82, "r_y1": 288.81, "r_x2": 158.82, "r_y2": 279.91, "r_x3": 50.11, "r_y3": 279.91, "coord_origin": "TOPLEFT" }, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.32, "r_y0": 288.58, "r_x1": 238.8, "r_y1": 288.58, "r_x2": 238.8, "r_y2": 280.0, "r_x3": 161.32, "r_y3": 280.0, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.52, "r_y0": 288.81, "r_x1": 286.36, "r_y1": 288.81, "r_x2": 286.36, "r_y2": 279.91, "r_x3": 241.52, "r_y3": 279.91, "coord_origin": "TOPLEFT" }, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.77, "r_x1": 211.38, "r_y1": 300.77, "r_x2": 211.38, "r_y2": 291.86, "r_x3": 50.11, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.27, "r_y0": 300.55, "r_x1": 229.2, "r_y1": 300.55, "r_x2": 229.2, "r_y2": 291.7, "r_x3": 214.27, "r_y3": 291.7, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.7, "r_y0": 300.77, "r_x1": 232.19, "r_y1": 300.77, "r_x2": 232.19, "r_y2": 291.86, "r_x3": 229.7, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.49, "r_y0": 300.55, "r_x1": 251.42, "r_y1": 300.55, "r_x2": 251.42, "r_y2": 291.7, "r_x3": 236.49, "r_y3": 291.7, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.81, "r_y0": 300.77, "r_x1": 286.36, "r_y1": 300.77, "r_x2": 286.36, "r_y2": 291.86, "r_x3": 254.81, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.72, "r_x1": 137.45, "r_y1": 312.72, "r_x2": 137.45, "r_y2": 303.82, "r_x3": 50.11, "r_y3": 303.82, "coord_origin": "TOPLEFT" }, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.3, "r_y0": 312.5, "r_x1": 148.24, "r_y1": 312.5, "r_x2": 148.24, "r_y2": 303.66, "r_x3": 141.3, "r_y3": 303.66, "coord_origin": "TOPLEFT" }, "text": "l$_{1}$", "orig": "l$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.59, "r_y0": 312.72, "r_x1": 286.36, "r_y1": 312.72, "r_x2": 286.36, "r_y2": 303.82, "r_x3": 152.59, "r_y3": 303.82, "coord_origin": "TOPLEFT" }, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.68, "r_x1": 89.68, "r_y1": 324.68, "r_x2": 89.68, "r_y2": 315.77, "r_x3": 50.11, "r_y3": 315.77, "coord_origin": "TOPLEFT" }, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.69, "r_y0": 324.46, "r_x1": 104.12, "r_y1": 324.46, "r_x2": 104.12, "r_y2": 315.61, "r_x3": 89.69, "r_y3": 315.61, "coord_origin": "TOPLEFT" }, "text": "l$_{iou}$", "orig": "l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.62, "r_y0": 324.68, "r_x1": 286.37, "r_y1": 324.68, "r_x2": 286.37, "r_y2": 315.77, "r_x3": 104.62, "r_y3": 315.77, "coord_origin": "TOPLEFT" }, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.64, "r_x1": 286.37, "r_y1": 336.64, "r_x2": 286.37, "r_y2": 327.73, "r_x3": 50.11, "r_y3": 327.73, "coord_origin": "TOPLEFT" }, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.59, "r_x1": 286.37, "r_y1": 348.59, "r_x2": 286.37, "r_y2": 339.68, "r_x3": 50.11, "r_y3": 339.68, "coord_origin": "TOPLEFT" }, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 360.54, "r_x1": 286.37, "r_y1": 360.54, "r_x2": 286.37, "r_y2": 351.64, "r_x3": 50.11, "r_y3": 351.64, "coord_origin": "TOPLEFT" }, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 372.5, "r_x1": 286.37, "r_y1": 372.5, "r_x2": 286.37, "r_y2": 363.59, "r_x3": 50.11, "r_y3": 363.59, "coord_origin": "TOPLEFT" }, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 384.45, "r_x1": 286.37, "r_y1": 384.45, "r_x2": 286.37, "r_y2": 375.55, "r_x3": 50.11, "r_y3": 375.55, "coord_origin": "TOPLEFT" }, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.41, "r_x1": 286.37, "r_y1": 396.41, "r_x2": 286.37, "r_y2": 387.5, "r_x3": 50.11, "r_y3": 387.5, "coord_origin": "TOPLEFT" }, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 408.37, "r_x1": 88.69, "r_y1": 408.37, "r_x2": 88.69, "r_y2": 399.46, "r_x3": 50.11, "r_y3": 399.46, "coord_origin": "TOPLEFT" }, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.65, "r_y0": 408.14, "r_x1": 170.05, "r_y1": 408.14, "r_x2": 170.05, "r_y2": 399.55, "r_x3": 91.65, "r_y3": 399.55, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.05, "r_y0": 408.37, "r_x1": 286.36, "r_y1": 408.37, "r_x2": 286.36, "r_y2": 399.46, "r_x3": 170.05, "r_y3": 399.46, "coord_origin": "TOPLEFT" }, "text": ", and 2) Our bounding boxes", "orig": ", and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 420.32, "r_x1": 181.97, "r_y1": 420.32, "r_x2": 181.97, "r_y2": 411.41, "r_x3": 50.11, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.09, "r_y0": 420.32, "r_x1": 197.75, "r_y1": 420.32, "r_x2": 197.75, "r_y2": 411.41, "r_x3": 189.09, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "3)", "orig": "3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.35, "r_y0": 420.32, "r_x1": 286.37, "r_y1": 420.32, "r_x2": 286.37, "r_y2": 411.41, "r_x3": 200.35, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "ensures a one-to-one", "orig": "ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 432.28, "r_x1": 286.37, "r_y1": 432.28, "r_x2": 286.37, "r_y2": 423.37, "r_x3": 50.11, "r_y3": 423.37, "coord_origin": "TOPLEFT" }, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 444.23, "r_x1": 158.3, "r_y1": 444.23, "r_x2": 158.3, "r_y2": 435.32, "r_x3": 50.11, "r_y3": 435.32, "coord_origin": "TOPLEFT" }, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l$_{s}$ ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l$_{box}$ . l$_{box}$ consists of the generally used l$_{1}$ loss for object detection and the IoU loss ( l$_{iou}$ ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets." }, { "label": "text", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 448.01, "r": 286.36, "b": 468.87, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 456.92, "r_x1": 286.36, "r_y1": 456.92, "r_x2": 286.36, "r_y2": 448.01, "r_x3": 62.07, "r_y3": 448.01, "coord_origin": "TOPLEFT" }, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 468.87, "r_x1": 91.38, "r_y1": 468.87, "r_x2": 91.38, "r_y2": 459.97, "r_x3": 50.11, "r_y3": 459.97, "coord_origin": "TOPLEFT" }, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The loss used to train the TableFormer can be defined as following:" }, { "label": "formula", "id": 15, "page_no": 5, "cluster": { "id": 15, "label": "formula", "bbox": { "l": 124.33, "t": 493.28, "r": 286.36, "b": 517.07, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.72, "r_y0": 502.13, "r_x1": 140.64, "r_y1": 502.13, "r_x2": 140.64, "r_y2": 493.28, "r_x3": 125.72, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.91, "r_y0": 502.13, "r_x1": 151.66, "r_y1": 502.13, "r_x2": 151.66, "r_y2": 493.28, "r_x3": 143.91, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.42, "r_y0": 502.13, "r_x1": 186.63, "r_y1": 502.13, "r_x2": 186.63, "r_y2": 493.28, "r_x3": 154.42, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$l$_{iou}$", "orig": "\u03bb$_{iou}$l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.34, "r_y0": 502.13, "r_x1": 197.09, "r_y1": 502.13, "r_x2": 197.09, "r_y2": 493.28, "r_x3": 189.34, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.3, "r_y0": 502.13, "r_x1": 211.65, "r_y1": 502.13, "r_x2": 211.65, "r_y2": 493.28, "r_x3": 199.3, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.33, "r_y0": 517.07, "r_x1": 127.3, "r_y1": 517.07, "r_x2": 127.3, "r_y2": 508.22, "r_x3": 124.33, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 130.27, "r_y0": 517.07, "r_x1": 138.01, "r_y1": 517.07, "r_x2": 138.01, "r_y2": 508.22, "r_x3": 130.27, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.78, "r_y0": 517.07, "r_x1": 153.33, "r_y1": 517.07, "r_x2": 153.33, "r_y2": 508.22, "r_x3": 140.78, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "\u03bbl$_{s}$", "orig": "\u03bbl$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.04, "r_y0": 517.07, "r_x1": 174.86, "r_y1": 517.07, "r_x2": 174.86, "r_y2": 508.22, "r_x3": 156.04, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "+ (1", "orig": "+ (1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 177.07, "r_y0": 517.07, "r_x1": 184.82, "r_y1": 517.07, "r_x2": 184.82, "r_y2": 507.67, "r_x3": 177.07, "r_y3": 507.67, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.03, "r_y0": 517.07, "r_x1": 192.84, "r_y1": 517.07, "r_x2": 192.84, "r_y2": 508.22, "r_x3": 187.03, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.85, "r_y0": 517.07, "r_x1": 196.72, "r_y1": 517.07, "r_x2": 196.72, "r_y2": 508.22, "r_x3": 192.85, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.72, "r_y0": 517.07, "r_x1": 211.65, "r_y1": 517.07, "r_x2": 211.65, "r_y2": 508.22, "r_x3": 196.72, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 509.92, "r_x1": 286.36, "r_y1": 509.92, "r_x2": 286.36, "r_y2": 501.01, "r_x3": 274.75, "r_y3": 501.01, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "l$_{box}$ = \u03bb$_{iou}$l$_{iou}$ + \u03bb$_{l}$$_{1}$ l = \u03bbl$_{s}$ + (1 \u2212 \u03bb ) l$_{box}$ (1)" }, { "label": "text", "id": 16, "page_no": 5, "cluster": { "id": 16, "label": "text", "bbox": { "l": 50.11, "t": 530.59, "r": 281.6, "b": 540.22, "coord_origin": "TOPLEFT" }, "confidence": 0.936, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 540.22, "r_x1": 74.45, "r_y1": 540.22, "r_x2": 74.45, "r_y2": 531.31, "r_x3": 50.11, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.94, "r_y0": 540.0, "r_x1": 82.75, "r_y1": 540.0, "r_x2": 82.75, "r_y2": 531.15, "r_x3": 76.94, "r_y3": 531.15, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.52, "r_y0": 540.0, "r_x1": 92.16, "r_y1": 540.0, "r_x2": 92.16, "r_y2": 530.59, "r_x3": 85.52, "r_y3": 530.59, "coord_origin": "TOPLEFT" }, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.65, "r_y0": 540.22, "r_x1": 135.6, "r_y1": 540.22, "r_x2": 135.6, "r_y2": 531.31, "r_x3": 94.65, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.09, "r_y0": 540.0, "r_x1": 172.63, "r_y1": 540.0, "r_x2": 172.63, "r_y2": 531.15, "r_x3": 138.09, "r_y3": 531.15, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.9, "r_y0": 540.0, "r_x1": 192.5, "r_y1": 540.0, "r_x2": 192.5, "r_y2": 530.59, "r_x3": 175.9, "r_y3": 530.59, "coord_origin": "TOPLEFT" }, "text": "\u2208$_{R}$", "orig": "\u2208$_{R}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.99, "r_y0": 540.22, "r_x1": 281.6, "r_y1": 540.22, "r_x2": 281.6, "r_y2": 531.31, "r_x3": 194.99, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where \u03bb \u2208 [0, 1], and \u03bb$_{iou}$, \u03bb$_{l}$$_{1}$ \u2208$_{R}$ are hyper-parameters." }, { "label": "section_header", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 50.11, "t": 555.92, "r": 171.98, "b": 566.66, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 566.66, "r_x1": 57.93, "r_y1": 566.66, "r_x2": 57.93, "r_y2": 555.92, "r_x3": 50.11, "r_y3": 555.92, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.35, "r_y0": 566.66, "r_x1": 171.98, "r_y1": 566.66, "r_x2": 171.98, "r_y2": 555.92, "r_x3": 68.35, "r_y3": 555.92, "coord_origin": "TOPLEFT" }, "text": "Experimental Results", "orig": "Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Experimental Results" }, { "label": "section_header", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 50.11, "t": 576.26, "r": 179.18, "b": 586.12, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 586.12, "r_x1": 64.69, "r_y1": 586.12, "r_x2": 64.69, "r_y2": 576.26, "r_x3": 50.11, "r_y3": 576.26, "coord_origin": "TOPLEFT" }, "text": "5.1.", "orig": "5.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.41, "r_y0": 586.12, "r_x1": 179.18, "r_y1": 586.12, "r_x2": 179.18, "r_y2": 576.26, "r_x3": 74.41, "r_y3": 576.26, "coord_origin": "TOPLEFT" }, "text": "Implementation Details", "orig": "Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1. Implementation Details" }, { "label": "text", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 595.73, "r": 286.37, "b": 640.51, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 604.64, "r_x1": 202.98, "r_y1": 604.64, "r_x2": 202.98, "r_y2": 595.73, "r_x3": 62.07, "r_y3": 595.73, "coord_origin": "TOPLEFT" }, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.38, "r_y0": 604.41, "r_x1": 286.36, "r_y1": 604.41, "r_x2": 286.36, "r_y2": 595.82, "r_x3": 205.38, "r_y3": 595.82, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 616.37, "r_x1": 70.04, "r_y1": 616.37, "r_x2": 70.04, "r_y2": 607.78, "r_x3": 50.11, "r_y3": 607.78, "coord_origin": "TOPLEFT" }, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 616.6, "r_x1": 286.36, "r_y1": 616.6, "r_x2": 286.36, "r_y2": 607.69, "r_x3": 70.04, "r_y3": 607.69, "coord_origin": "TOPLEFT" }, "text": ". The input images are resized to 448*448 pixels and", "orig": ". The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 628.55, "r_x1": 286.37, "r_y1": 628.55, "r_x2": 286.37, "r_y2": 619.64, "r_x3": 50.11, "r_y3": 619.64, "coord_origin": "TOPLEFT" }, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 640.51, "r_x1": 207.03, "r_y1": 640.51, "r_x2": 207.03, "r_y2": 631.6, "r_x3": 50.11, "r_y3": 631.6, "coord_origin": "TOPLEFT" }, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:" }, { "label": "formula", "id": 18, "page_no": 5, "cluster": { "id": 18, "label": "formula", "bbox": { "l": 91.66, "t": 653.83, "r": 286.36, "b": 678.4, "coord_origin": "TOPLEFT" }, "confidence": 0.844, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.66, "r_y0": 663.45, "r_x1": 186.02, "r_y1": 663.45, "r_x2": 186.02, "r_y2": 654.55, "r_x3": 91.66, "r_y3": 654.55, "coord_origin": "TOPLEFT" }, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.51, "r_y0": 663.23, "r_x1": 196.26, "r_y1": 663.23, "r_x2": 196.26, "r_y2": 653.83, "r_x3": 188.51, "r_y3": 653.83, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.75, "r_y0": 663.45, "r_x1": 244.81, "r_y1": 663.45, "r_x2": 244.81, "r_y2": 654.55, "r_x3": 198.75, "r_y3": 654.55, "coord_origin": "TOPLEFT" }, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.02, "r_y0": 678.4, "r_x1": 186.25, "r_y1": 678.4, "r_x2": 186.25, "r_y2": 669.49, "r_x3": 101.02, "r_y3": 669.49, "coord_origin": "TOPLEFT" }, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.74, "r_y0": 678.18, "r_x1": 196.48, "r_y1": 678.18, "r_x2": 196.48, "r_y2": 668.77, "r_x3": 188.74, "r_y3": 668.77, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.98, "r_y0": 678.4, "r_x1": 244.81, "r_y1": 678.4, "r_x2": 244.81, "r_y2": 669.49, "r_x3": 198.98, "r_y3": 669.49, "coord_origin": "TOPLEFT" }, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 671.02, "r_x1": 286.36, "r_y1": 671.02, "r_x2": 286.36, "r_y2": 662.12, "r_x3": 274.75, "r_y3": 662.12, "coord_origin": "TOPLEFT" }, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)" }, { "label": "text", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 692.29, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved" }, { "label": "text", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 545.12, "r_y1": 84.11, "r_x2": 545.12, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 339.99, "r_y1": 96.07, "r_x2": 339.99, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.89, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 346.89, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 492.96, "r_y1": 108.02, "r_x2": 492.96, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 116.23, "r": 545.12, "b": 328.37, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 125.14, "r_x1": 545.11, "r_y1": 125.14, "r_x2": 545.11, "r_y2": 116.23, "r_x3": 320.82, "r_y3": 116.23, "coord_origin": "TOPLEFT" }, "text": "The Transformer Encoder consists of two \u201cTransformer", "orig": "The Transformer Encoder consists of two \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 137.09, "r_x1": 545.12, "r_y1": 137.09, "r_x2": 545.12, "r_y2": 128.18, "r_x3": 308.86, "r_y3": 128.18, "coord_origin": "TOPLEFT" }, "text": "Encoder Layers\u201d, with an input feature size of 512, feed", "orig": "Encoder Layers\u201d, with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 149.05, "r_x1": 545.12, "r_y1": 149.05, "r_x2": 545.12, "r_y2": 140.14, "r_x3": 308.86, "r_y3": 140.14, "coord_origin": "TOPLEFT" }, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 161.0, "r_x1": 545.12, "r_y1": 161.0, "r_x2": 545.12, "r_y2": 152.09, "r_x3": 308.86, "r_y3": 152.09, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder it is composed of four \u201cTransformer", "orig": "Transformer Decoder it is composed of four \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 172.96, "r_x1": 545.12, "r_y1": 172.96, "r_x2": 545.12, "r_y2": 164.05, "r_x3": 308.86, "r_y3": 164.05, "coord_origin": "TOPLEFT" }, "text": "Decoder Layers\u201d with similar input and output dimensions", "orig": "Decoder Layers\u201d with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 184.91, "r_x1": 467.22, "r_y1": 184.91, "r_x2": 467.22, "r_y2": 176.01, "r_x3": 308.86, "r_y3": 176.01, "coord_origin": "TOPLEFT" }, "text": "as the \u201cTransformer Encoder Layers\u201d.", "orig": "as the \u201cTransformer Encoder Layers\u201d.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.44, "r_y0": 184.91, "r_x1": 545.12, "r_y1": 184.91, "r_x2": 545.12, "r_y2": 176.01, "r_x3": 475.44, "r_y3": 176.01, "coord_origin": "TOPLEFT" }, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 196.87, "r_x1": 545.12, "r_y1": 196.87, "r_x2": 545.12, "r_y2": 187.96, "r_x3": 308.86, "r_y3": 187.96, "coord_origin": "TOPLEFT" }, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 208.82, "r_x1": 545.12, "r_y1": 208.82, "r_x2": 545.12, "r_y2": 199.92, "r_x3": 308.86, "r_y3": 199.92, "coord_origin": "TOPLEFT" }, "text": "mentation parameters, our extensive experimentation has", "orig": "mentation parameters, our extensive experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 220.78, "r_x1": 545.12, "r_y1": 220.78, "r_x2": 545.12, "r_y2": 211.87, "r_x3": 308.86, "r_y3": 211.87, "coord_origin": "TOPLEFT" }, "text": "proved this setup to be more suitable for table images. We", "orig": "proved this setup to be more suitable for table images. We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 232.73, "r_x1": 545.12, "r_y1": 232.73, "r_x2": 545.12, "r_y2": 223.83, "r_x3": 308.86, "r_y3": 223.83, "coord_origin": "TOPLEFT" }, "text": "attribute this finding to the inherent design of table im-", "orig": "attribute this finding to the inherent design of table im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 244.69, "r_x1": 545.12, "r_y1": 244.69, "r_x2": 545.12, "r_y2": 235.78, "r_x3": 308.86, "r_y3": 235.78, "coord_origin": "TOPLEFT" }, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 256.64, "r_x1": 545.12, "r_y1": 256.64, "r_x2": 545.12, "r_y2": 247.74, "r_x3": 308.86, "r_y3": 247.74, "coord_origin": "TOPLEFT" }, "text": "elaborate content present in other scopes (e.g. the COCO", "orig": "elaborate content present in other scopes (e.g. the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 268.6, "r_x1": 342.34, "r_y1": 268.6, "r_x2": 342.34, "r_y2": 259.69, "r_x3": 308.86, "r_y3": 259.69, "coord_origin": "TOPLEFT" }, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.95, "r_y0": 268.6, "r_x1": 545.12, "r_y1": 268.6, "r_x2": 545.12, "r_y2": 259.69, "r_x3": 348.95, "r_y3": 259.69, "coord_origin": "TOPLEFT" }, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 280.55, "r_x1": 545.12, "r_y1": 280.55, "r_x2": 545.12, "r_y2": 271.65, "r_x3": 308.86, "r_y3": 271.65, "coord_origin": "TOPLEFT" }, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 292.51, "r_x1": 545.12, "r_y1": 292.51, "r_x2": 545.12, "r_y2": 283.6, "r_x3": 308.86, "r_y3": 283.6, "coord_origin": "TOPLEFT" }, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.46, "r_x1": 545.12, "r_y1": 304.46, "r_x2": 545.12, "r_y2": 295.56, "r_x3": 308.86, "r_y3": 295.56, "coord_origin": "TOPLEFT" }, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.42, "r_x1": 545.12, "r_y1": 316.42, "r_x2": 545.12, "r_y2": 307.51, "r_x3": 308.86, "r_y3": 307.51, "coord_origin": "TOPLEFT" }, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 328.37, "r_x1": 532.48, "r_y1": 328.37, "r_x2": 532.48, "r_y2": 319.47, "r_x3": 308.86, "r_y3": 319.47, "coord_origin": "TOPLEFT" }, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The Transformer Encoder consists of two \"Transformer Encoder Layers\", with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four \"Transformer Decoder Layers\" with similar input and output dimensions as the \"Transformer Encoder Layers\". Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5." }, { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 336.58, "r": 545.12, "b": 429.17, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 345.48, "r_x1": 545.11, "r_y1": 345.48, "r_x2": 545.11, "r_y2": 336.58, "r_x3": 320.82, "r_y3": 336.58, "coord_origin": "TOPLEFT" }, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 357.44, "r_x1": 403.74, "r_y1": 357.44, "r_x2": 403.74, "r_y2": 348.53, "r_x3": 308.86, "r_y3": 348.53, "coord_origin": "TOPLEFT" }, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.08, "r_y0": 357.21, "r_x1": 503.54, "r_y1": 357.21, "r_x2": 503.54, "r_y2": 348.62, "r_x3": 406.08, "r_y3": 348.62, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 503.54, "r_y0": 357.44, "r_x1": 506.03, "r_y1": 357.44, "r_x2": 506.03, "r_y2": 348.53, "r_x3": 503.54, "r_y3": 348.53, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.4, "r_y0": 357.21, "r_x1": 545.11, "r_y1": 357.21, "r_x2": 545.11, "r_y2": 348.62, "r_x3": 508.4, "r_y3": 348.62, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 369.16, "r_x1": 343.16, "r_y1": 369.16, "r_x2": 343.16, "r_y2": 360.58, "r_x3": 308.86, "r_y3": 360.58, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.16, "r_y0": 369.39, "r_x1": 362.2, "r_y1": 369.39, "r_x2": 362.2, "r_y2": 360.49, "r_x3": 343.16, "r_y3": 360.49, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 364.29, "r_y0": 369.16, "r_x1": 440.94, "r_y1": 369.16, "r_x2": 440.94, "r_y2": 360.58, "r_x3": 364.29, "r_y3": 360.58, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.94, "r_y0": 369.39, "r_x1": 545.11, "r_y1": 369.39, "r_x2": 545.11, "r_y2": 360.49, "r_x3": 440.94, "r_y3": 360.49, "coord_origin": "TOPLEFT" }, "text": ". Taking the PubTabNet as", "orig": ". Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 381.35, "r_x1": 545.12, "r_y1": 381.35, "r_x2": 545.12, "r_y2": 372.44, "r_x3": 308.86, "r_y3": 372.44, "coord_origin": "TOPLEFT" }, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 393.31, "r_x1": 545.12, "r_y1": 393.31, "r_x2": 545.12, "r_y2": 384.4, "r_x3": 308.86, "r_y3": 384.4, "coord_origin": "TOPLEFT" }, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 405.04, "r_x1": 314.67, "r_y1": 405.04, "r_x2": 314.67, "r_y2": 396.19, "r_x3": 308.86, "r_y3": 396.19, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.66, "r_y0": 405.26, "r_x1": 360.39, "r_y1": 405.26, "r_x2": 360.39, "r_y2": 396.35, "r_x3": 318.66, "r_y3": 396.35, "coord_origin": "TOPLEFT" }, "text": "set to 0.5.", "orig": "set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.96, "r_y0": 405.26, "r_x1": 545.11, "r_y1": 405.26, "r_x2": 545.11, "r_y2": 396.35, "r_x3": 367.96, "r_y3": 396.35, "coord_origin": "TOPLEFT" }, "text": "Afterwards, we reduce the learning rate to", "orig": "Afterwards, we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 417.21, "r_x1": 545.12, "r_y1": 417.21, "r_x2": 545.12, "r_y2": 408.31, "r_x3": 308.86, "r_y3": 408.31, "coord_origin": "TOPLEFT" }, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 429.17, "r_x1": 360.97, "r_y1": 429.17, "r_x2": 360.97, "r_y2": 420.26, "r_x3": 308.86, "r_y3": 420.26, "coord_origin": "TOPLEFT" }, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network , Structure Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence." }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 437.37, "r": 545.12, "b": 553.88, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 446.28, "r_x1": 545.11, "r_y1": 446.28, "r_x2": 545.11, "r_y2": 437.37, "r_x3": 320.82, "r_y3": 437.37, "coord_origin": "TOPLEFT" }, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 458.24, "r_x1": 384.63, "r_y1": 458.24, "r_x2": 384.63, "r_y2": 449.33, "r_x3": 308.86, "r_y3": 449.33, "coord_origin": "TOPLEFT" }, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 458.24, "r_x1": 545.12, "r_y1": 458.24, "r_x2": 545.12, "r_y2": 449.33, "r_x3": 391.37, "r_y3": 449.33, "coord_origin": "TOPLEFT" }, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 470.19, "r_x1": 494.01, "r_y1": 470.19, "r_x2": 494.01, "r_y2": 461.28, "r_x3": 308.86, "r_y3": 461.28, "coord_origin": "TOPLEFT" }, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.08, "r_y0": 469.96, "r_x1": 545.11, "r_y1": 469.96, "r_x2": 545.11, "r_y2": 461.37, "r_x3": 498.08, "r_y3": 461.37, "coord_origin": "TOPLEFT" }, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 481.92, "r_x1": 364.44, "r_y1": 481.92, "r_x2": 364.44, "r_y2": 473.33, "r_x3": 308.86, "r_y3": 473.33, "coord_origin": "TOPLEFT" }, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06, "r_y0": 482.15, "r_x1": 545.11, "r_y1": 482.15, "r_x2": 545.11, "r_y2": 473.24, "r_x3": 367.06, "r_y3": 473.24, "coord_origin": "TOPLEFT" }, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 494.1, "r_x1": 545.12, "r_y1": 494.1, "r_x2": 545.12, "r_y2": 485.19, "r_x3": 308.86, "r_y3": 485.19, "coord_origin": "TOPLEFT" }, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 506.06, "r_x1": 545.12, "r_y1": 506.06, "r_x2": 545.12, "r_y2": 497.15, "r_x3": 308.86, "r_y3": 497.15, "coord_origin": "TOPLEFT" }, "text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 518.01, "r_x1": 545.12, "r_y1": 518.01, "r_x2": 545.12, "r_y2": 509.11, "r_x3": 308.86, "r_y3": 509.11, "coord_origin": "TOPLEFT" }, "text": "faster autoregressive decoding. This is achieved by storing", "orig": "faster autoregressive decoding. This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 529.97, "r_x1": 545.12, "r_y1": 529.97, "r_x2": 545.12, "r_y2": 521.06, "r_x3": 308.86, "r_y3": 521.06, "coord_origin": "TOPLEFT" }, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 541.92, "r_x1": 545.12, "r_y1": 541.92, "r_x2": 545.12, "r_y2": 533.02, "r_x3": 308.86, "r_y3": 533.02, "coord_origin": "TOPLEFT" }, "text": "each time step. Therefore, we only compute the attention", "orig": "each time step. Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 553.88, "r_x1": 377.22, "r_y1": 553.88, "r_x2": 377.22, "r_y2": 544.97, "r_x3": 308.86, "r_y3": 544.97, "coord_origin": "TOPLEFT" }, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag." }, { "label": "section_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 308.86, "t": 579.55, "r": 397.44, "b": 589.41, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 589.41, "r_x1": 323.9, "r_y1": 589.41, "r_x2": 323.9, "r_y2": 579.55, "r_x3": 308.86, "r_y3": 579.55, "coord_origin": "TOPLEFT" }, "text": "5.2.", "orig": "5.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.93, "r_y0": 589.41, "r_x1": 397.44, "r_y1": 589.41, "r_x2": 397.44, "r_y2": 579.55, "r_x3": 333.93, "r_y3": 579.55, "coord_origin": "TOPLEFT" }, "text": "Generalization", "orig": "Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2. Generalization" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 603.45, "r": 545.12, "b": 672.13, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 612.36, "r_x1": 545.11, "r_y1": 612.36, "r_x2": 545.11, "r_y2": 603.45, "r_x3": 320.82, "r_y3": 603.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 624.31, "r_x1": 545.12, "r_y1": 624.31, "r_x2": 545.12, "r_y2": 615.4, "r_x3": 308.86, "r_y3": 615.4, "coord_origin": "TOPLEFT" }, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 636.27, "r_x1": 545.12, "r_y1": 636.27, "r_x2": 545.12, "r_y2": 627.36, "r_x3": 308.86, "r_y3": 627.36, "coord_origin": "TOPLEFT" }, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 648.22, "r_x1": 545.12, "r_y1": 648.22, "r_x2": 545.12, "r_y2": 639.31, "r_x3": 308.86, "r_y3": 639.31, "coord_origin": "TOPLEFT" }, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 660.18, "r_x1": 545.12, "r_y1": 660.18, "r_x2": 545.12, "r_y2": 651.27, "r_x3": 308.86, "r_y3": 651.27, "coord_origin": "TOPLEFT" }, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 672.13, "r_x1": 350.7, "r_y1": 672.13, "r_x2": 350.7, "r_y2": 663.23, "r_x3": 308.86, "r_y3": 663.23, "coord_origin": "TOPLEFT" }, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively." }, { "label": "text", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "text", "bbox": { "l": 308.86, "t": 680.34, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 320.82, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 396.21, "r_y1": 701.2, "r_x2": 396.21, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet dataset.", "orig": "SynthTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.41, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 406.41, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Throughout our experiments, the", "orig": "Throughout our experiments, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 495.94, "r_y1": 713.15, "r_x2": 495.94, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized." }, { "label": "page_footer", "id": 17, "page_no": 5, "cluster": { "id": 17, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" } ], "body": [ { "label": "text", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 286.37, "b": 155.85, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 286.37, "r_y1": 84.11, "r_x2": 286.37, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 96.07, "r_x1": 286.37, "r_y1": 96.07, "r_x2": 286.37, "r_y2": 87.16, "r_x3": 50.11, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.02, "r_x1": 286.37, "r_y1": 108.02, "r_x2": 286.37, "r_y2": 99.12, "r_x3": 50.11, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 119.98, "r_x1": 286.37, "r_y1": 119.98, "r_x2": 286.37, "r_y2": 111.07, "r_x3": 50.11, "r_y3": 111.07, "coord_origin": "TOPLEFT" }, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.93, "r_x1": 286.37, "r_y1": 131.93, "r_x2": 286.37, "r_y2": 123.03, "r_x3": 50.11, "r_y3": 123.03, "coord_origin": "TOPLEFT" }, "text": "of objects may exist. In our case, we know up front that", "orig": "of objects may exist. In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 143.89, "r_x1": 286.37, "r_y1": 143.89, "r_x2": 286.37, "r_y2": 134.98, "r_x3": 50.11, "r_y3": 134.98, "coord_origin": "TOPLEFT" }, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 155.85, "r_x1": 175.16, "r_y1": 155.85, "r_x2": 175.16, "r_y2": 146.94, "r_x3": 50.11, "r_y3": 146.94, "coord_origin": "TOPLEFT" }, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 50.11, "t": 159.62, "r": 286.37, "b": 240.26, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 168.53, "r_x1": 286.36, "r_y1": 168.53, "r_x2": 286.36, "r_y2": 159.62, "r_x3": 62.07, "r_y3": 159.62, "coord_origin": "TOPLEFT" }, "text": "The output features for each table cell are then fed", "orig": "The output features for each table cell are then fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 180.49, "r_x1": 286.37, "r_y1": 180.49, "r_x2": 286.37, "r_y2": 171.58, "r_x3": 50.11, "r_y3": 171.58, "coord_origin": "TOPLEFT" }, "text": "into the feed-forward network (FFN). The FFN consists", "orig": "into the feed-forward network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 192.44, "r_x1": 286.37, "r_y1": 192.44, "r_x2": 286.37, "r_y2": 183.54, "r_x3": 50.11, "r_y3": 183.54, "coord_origin": "TOPLEFT" }, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 204.4, "r_x1": 286.37, "r_y1": 204.4, "r_x2": 286.37, "r_y2": 195.49, "r_x3": 50.11, "r_y3": 195.49, "coord_origin": "TOPLEFT" }, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 216.35, "r_x1": 286.37, "r_y1": 216.35, "r_x2": 286.37, "r_y2": 207.45, "r_x3": 50.11, "r_y3": 207.45, "coord_origin": "TOPLEFT" }, "text": "the bounding box of each table cell. Finally, the predicted", "orig": "the bounding box of each table cell. Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 228.31, "r_x1": 286.37, "r_y1": 228.31, "r_x2": 286.37, "r_y2": 219.4, "r_x3": 50.11, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 240.26, "r_x1": 181.55, "r_y1": 240.26, "r_x2": 181.55, "r_y2": 231.36, "r_x3": 50.11, "r_y3": 231.36, "coord_origin": "TOPLEFT" }, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer." }, { "label": "text", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "text", "bbox": { "l": 50.11, "t": 243.92, "r": 286.37, "b": 444.23, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 252.88, "r_x1": 129.21, "r_y1": 252.88, "r_x2": 129.21, "r_y2": 243.92, "r_x3": 62.07, "r_y3": 243.92, "coord_origin": "TOPLEFT" }, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.45, "r_y0": 252.95, "r_x1": 286.36, "r_y1": 252.95, "r_x2": 286.36, "r_y2": 244.04, "r_x3": 134.45, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "We formulate a multi-task loss Eq. 2", "orig": "We formulate a multi-task loss Eq. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.9, "r_x1": 286.37, "r_y1": 264.9, "r_x2": 286.37, "r_y2": 256.0, "r_x3": 50.11, "r_y3": 256.0, "coord_origin": "TOPLEFT" }, "text": "to train our network. The Cross-Entropy loss (denoted as", "orig": "to train our network. The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.64, "r_x1": 56.85, "r_y1": 276.64, "r_x2": 56.85, "r_y2": 267.79, "r_x3": 50.11, "r_y3": 267.79, "coord_origin": "TOPLEFT" }, "text": "l$_{s}$", "orig": "l$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 57.34, "r_y0": 276.86, "r_x1": 135.4, "r_y1": 276.86, "r_x2": 135.4, "r_y2": 267.95, "r_x3": 57.34, "r_y3": 267.95, "coord_origin": "TOPLEFT" }, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.74, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04, "r_x3": 137.74, "r_y3": 268.04, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.64, "r_y0": 276.86, "r_x1": 286.36, "r_y1": 276.86, "r_x2": 286.36, "r_y2": 267.95, "r_x3": 213.64, "r_y3": 267.95, "coord_origin": "TOPLEFT" }, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.81, "r_x1": 158.82, "r_y1": 288.81, "r_x2": 158.82, "r_y2": 279.91, "r_x3": 50.11, "r_y3": 279.91, "coord_origin": "TOPLEFT" }, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.32, "r_y0": 288.58, "r_x1": 238.8, "r_y1": 288.58, "r_x2": 238.8, "r_y2": 280.0, "r_x3": 161.32, "r_y3": 280.0, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.52, "r_y0": 288.81, "r_x1": 286.36, "r_y1": 288.81, "r_x2": 286.36, "r_y2": 279.91, "r_x3": 241.52, "r_y3": 279.91, "coord_origin": "TOPLEFT" }, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.77, "r_x1": 211.38, "r_y1": 300.77, "r_x2": 211.38, "r_y2": 291.86, "r_x3": 50.11, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.27, "r_y0": 300.55, "r_x1": 229.2, "r_y1": 300.55, "r_x2": 229.2, "r_y2": 291.7, "r_x3": 214.27, "r_y3": 291.7, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.7, "r_y0": 300.77, "r_x1": 232.19, "r_y1": 300.77, "r_x2": 232.19, "r_y2": 291.86, "r_x3": 229.7, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.49, "r_y0": 300.55, "r_x1": 251.42, "r_y1": 300.55, "r_x2": 251.42, "r_y2": 291.7, "r_x3": 236.49, "r_y3": 291.7, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.81, "r_y0": 300.77, "r_x1": 286.36, "r_y1": 300.77, "r_x2": 286.36, "r_y2": 291.86, "r_x3": 254.81, "r_y3": 291.86, "coord_origin": "TOPLEFT" }, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.72, "r_x1": 137.45, "r_y1": 312.72, "r_x2": 137.45, "r_y2": 303.82, "r_x3": 50.11, "r_y3": 303.82, "coord_origin": "TOPLEFT" }, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.3, "r_y0": 312.5, "r_x1": 148.24, "r_y1": 312.5, "r_x2": 148.24, "r_y2": 303.66, "r_x3": 141.3, "r_y3": 303.66, "coord_origin": "TOPLEFT" }, "text": "l$_{1}$", "orig": "l$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.59, "r_y0": 312.72, "r_x1": 286.36, "r_y1": 312.72, "r_x2": 286.36, "r_y2": 303.82, "r_x3": 152.59, "r_y3": 303.82, "coord_origin": "TOPLEFT" }, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.68, "r_x1": 89.68, "r_y1": 324.68, "r_x2": 89.68, "r_y2": 315.77, "r_x3": 50.11, "r_y3": 315.77, "coord_origin": "TOPLEFT" }, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.69, "r_y0": 324.46, "r_x1": 104.12, "r_y1": 324.46, "r_x2": 104.12, "r_y2": 315.61, "r_x3": 89.69, "r_y3": 315.61, "coord_origin": "TOPLEFT" }, "text": "l$_{iou}$", "orig": "l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.62, "r_y0": 324.68, "r_x1": 286.37, "r_y1": 324.68, "r_x2": 286.37, "r_y2": 315.77, "r_x3": 104.62, "r_y3": 315.77, "coord_origin": "TOPLEFT" }, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.64, "r_x1": 286.37, "r_y1": 336.64, "r_x2": 286.37, "r_y2": 327.73, "r_x3": 50.11, "r_y3": 327.73, "coord_origin": "TOPLEFT" }, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.59, "r_x1": 286.37, "r_y1": 348.59, "r_x2": 286.37, "r_y2": 339.68, "r_x3": 50.11, "r_y3": 339.68, "coord_origin": "TOPLEFT" }, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 360.54, "r_x1": 286.37, "r_y1": 360.54, "r_x2": 286.37, "r_y2": 351.64, "r_x3": 50.11, "r_y3": 351.64, "coord_origin": "TOPLEFT" }, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 372.5, "r_x1": 286.37, "r_y1": 372.5, "r_x2": 286.37, "r_y2": 363.59, "r_x3": 50.11, "r_y3": 363.59, "coord_origin": "TOPLEFT" }, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 384.45, "r_x1": 286.37, "r_y1": 384.45, "r_x2": 286.37, "r_y2": 375.55, "r_x3": 50.11, "r_y3": 375.55, "coord_origin": "TOPLEFT" }, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.41, "r_x1": 286.37, "r_y1": 396.41, "r_x2": 286.37, "r_y2": 387.5, "r_x3": 50.11, "r_y3": 387.5, "coord_origin": "TOPLEFT" }, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 408.37, "r_x1": 88.69, "r_y1": 408.37, "r_x2": 88.69, "r_y2": 399.46, "r_x3": 50.11, "r_y3": 399.46, "coord_origin": "TOPLEFT" }, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.65, "r_y0": 408.14, "r_x1": 170.05, "r_y1": 408.14, "r_x2": 170.05, "r_y2": 399.55, "r_x3": 91.65, "r_y3": 399.55, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.05, "r_y0": 408.37, "r_x1": 286.36, "r_y1": 408.37, "r_x2": 286.36, "r_y2": 399.46, "r_x3": 170.05, "r_y3": 399.46, "coord_origin": "TOPLEFT" }, "text": ", and 2) Our bounding boxes", "orig": ", and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 420.32, "r_x1": 181.97, "r_y1": 420.32, "r_x2": 181.97, "r_y2": 411.41, "r_x3": 50.11, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.09, "r_y0": 420.32, "r_x1": 197.75, "r_y1": 420.32, "r_x2": 197.75, "r_y2": 411.41, "r_x3": 189.09, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "3)", "orig": "3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.35, "r_y0": 420.32, "r_x1": 286.37, "r_y1": 420.32, "r_x2": 286.37, "r_y2": 411.41, "r_x3": 200.35, "r_y3": 411.41, "coord_origin": "TOPLEFT" }, "text": "ensures a one-to-one", "orig": "ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 432.28, "r_x1": 286.37, "r_y1": 432.28, "r_x2": 286.37, "r_y2": 423.37, "r_x3": 50.11, "r_y3": 423.37, "coord_origin": "TOPLEFT" }, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 444.23, "r_x1": 158.3, "r_y1": 444.23, "r_x2": 158.3, "r_y2": 435.32, "r_x3": 50.11, "r_y3": 435.32, "coord_origin": "TOPLEFT" }, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l$_{s}$ ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l$_{box}$ . l$_{box}$ consists of the generally used l$_{1}$ loss for object detection and the IoU loss ( l$_{iou}$ ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets." }, { "label": "text", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 448.01, "r": 286.36, "b": 468.87, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 456.92, "r_x1": 286.36, "r_y1": 456.92, "r_x2": 286.36, "r_y2": 448.01, "r_x3": 62.07, "r_y3": 448.01, "coord_origin": "TOPLEFT" }, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 468.87, "r_x1": 91.38, "r_y1": 468.87, "r_x2": 91.38, "r_y2": 459.97, "r_x3": 50.11, "r_y3": 459.97, "coord_origin": "TOPLEFT" }, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The loss used to train the TableFormer can be defined as following:" }, { "label": "formula", "id": 15, "page_no": 5, "cluster": { "id": 15, "label": "formula", "bbox": { "l": 124.33, "t": 493.28, "r": 286.36, "b": 517.07, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.72, "r_y0": 502.13, "r_x1": 140.64, "r_y1": 502.13, "r_x2": 140.64, "r_y2": 493.28, "r_x3": 125.72, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.91, "r_y0": 502.13, "r_x1": 151.66, "r_y1": 502.13, "r_x2": 151.66, "r_y2": 493.28, "r_x3": 143.91, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.42, "r_y0": 502.13, "r_x1": 186.63, "r_y1": 502.13, "r_x2": 186.63, "r_y2": 493.28, "r_x3": 154.42, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$l$_{iou}$", "orig": "\u03bb$_{iou}$l$_{iou}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.34, "r_y0": 502.13, "r_x1": 197.09, "r_y1": 502.13, "r_x2": 197.09, "r_y2": 493.28, "r_x3": 189.34, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.3, "r_y0": 502.13, "r_x1": 211.65, "r_y1": 502.13, "r_x2": 211.65, "r_y2": 493.28, "r_x3": 199.3, "r_y3": 493.28, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.33, "r_y0": 517.07, "r_x1": 127.3, "r_y1": 517.07, "r_x2": 127.3, "r_y2": 508.22, "r_x3": 124.33, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 130.27, "r_y0": 517.07, "r_x1": 138.01, "r_y1": 517.07, "r_x2": 138.01, "r_y2": 508.22, "r_x3": 130.27, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.78, "r_y0": 517.07, "r_x1": 153.33, "r_y1": 517.07, "r_x2": 153.33, "r_y2": 508.22, "r_x3": 140.78, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "\u03bbl$_{s}$", "orig": "\u03bbl$_{s}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.04, "r_y0": 517.07, "r_x1": 174.86, "r_y1": 517.07, "r_x2": 174.86, "r_y2": 508.22, "r_x3": 156.04, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "+ (1", "orig": "+ (1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 177.07, "r_y0": 517.07, "r_x1": 184.82, "r_y1": 517.07, "r_x2": 184.82, "r_y2": 507.67, "r_x3": 177.07, "r_y3": 507.67, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.03, "r_y0": 517.07, "r_x1": 192.84, "r_y1": 517.07, "r_x2": 192.84, "r_y2": 508.22, "r_x3": 187.03, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.85, "r_y0": 517.07, "r_x1": 196.72, "r_y1": 517.07, "r_x2": 196.72, "r_y2": 508.22, "r_x3": 192.85, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.72, "r_y0": 517.07, "r_x1": 211.65, "r_y1": 517.07, "r_x2": 211.65, "r_y2": 508.22, "r_x3": 196.72, "r_y3": 508.22, "coord_origin": "TOPLEFT" }, "text": "l$_{box}$", "orig": "l$_{box}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 509.92, "r_x1": 286.36, "r_y1": 509.92, "r_x2": 286.36, "r_y2": 501.01, "r_x3": 274.75, "r_y3": 501.01, "coord_origin": "TOPLEFT" }, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "l$_{box}$ = \u03bb$_{iou}$l$_{iou}$ + \u03bb$_{l}$$_{1}$ l = \u03bbl$_{s}$ + (1 \u2212 \u03bb ) l$_{box}$ (1)" }, { "label": "text", "id": 16, "page_no": 5, "cluster": { "id": 16, "label": "text", "bbox": { "l": 50.11, "t": 530.59, "r": 281.6, "b": 540.22, "coord_origin": "TOPLEFT" }, "confidence": 0.936, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 540.22, "r_x1": 74.45, "r_y1": 540.22, "r_x2": 74.45, "r_y2": 531.31, "r_x3": 50.11, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.94, "r_y0": 540.0, "r_x1": 82.75, "r_y1": 540.0, "r_x2": 82.75, "r_y2": 531.15, "r_x3": 76.94, "r_y3": 531.15, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 85.52, "r_y0": 540.0, "r_x1": 92.16, "r_y1": 540.0, "r_x2": 92.16, "r_y2": 530.59, "r_x3": 85.52, "r_y3": 530.59, "coord_origin": "TOPLEFT" }, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 94.65, "r_y0": 540.22, "r_x1": 135.6, "r_y1": 540.22, "r_x2": 135.6, "r_y2": 531.31, "r_x3": 94.65, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.09, "r_y0": 540.0, "r_x1": 172.63, "r_y1": 540.0, "r_x2": 172.63, "r_y2": 531.15, "r_x3": 138.09, "r_y3": 531.15, "coord_origin": "TOPLEFT" }, "text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.9, "r_y0": 540.0, "r_x1": 192.5, "r_y1": 540.0, "r_x2": 192.5, "r_y2": 530.59, "r_x3": 175.9, "r_y3": 530.59, "coord_origin": "TOPLEFT" }, "text": "\u2208$_{R}$", "orig": "\u2208$_{R}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.99, "r_y0": 540.22, "r_x1": 281.6, "r_y1": 540.22, "r_x2": 281.6, "r_y2": 531.31, "r_x3": 194.99, "r_y3": 531.31, "coord_origin": "TOPLEFT" }, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where \u03bb \u2208 [0, 1], and \u03bb$_{iou}$, \u03bb$_{l}$$_{1}$ \u2208$_{R}$ are hyper-parameters." }, { "label": "section_header", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 50.11, "t": 555.92, "r": 171.98, "b": 566.66, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 566.66, "r_x1": 57.93, "r_y1": 566.66, "r_x2": 57.93, "r_y2": 555.92, "r_x3": 50.11, "r_y3": 555.92, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.35, "r_y0": 566.66, "r_x1": 171.98, "r_y1": 566.66, "r_x2": 171.98, "r_y2": 555.92, "r_x3": 68.35, "r_y3": 555.92, "coord_origin": "TOPLEFT" }, "text": "Experimental Results", "orig": "Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Experimental Results" }, { "label": "section_header", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 50.11, "t": 576.26, "r": 179.18, "b": 586.12, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 586.12, "r_x1": 64.69, "r_y1": 586.12, "r_x2": 64.69, "r_y2": 576.26, "r_x3": 50.11, "r_y3": 576.26, "coord_origin": "TOPLEFT" }, "text": "5.1.", "orig": "5.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.41, "r_y0": 586.12, "r_x1": 179.18, "r_y1": 586.12, "r_x2": 179.18, "r_y2": 576.26, "r_x3": 74.41, "r_y3": 576.26, "coord_origin": "TOPLEFT" }, "text": "Implementation Details", "orig": "Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1. Implementation Details" }, { "label": "text", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 595.73, "r": 286.37, "b": 640.51, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 604.64, "r_x1": 202.98, "r_y1": 604.64, "r_x2": 202.98, "r_y2": 595.73, "r_x3": 62.07, "r_y3": 595.73, "coord_origin": "TOPLEFT" }, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 205.38, "r_y0": 604.41, "r_x1": 286.36, "r_y1": 604.41, "r_x2": 286.36, "r_y2": 595.82, "r_x3": 205.38, "r_y3": 595.82, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 616.37, "r_x1": 70.04, "r_y1": 616.37, "r_x2": 70.04, "r_y2": 607.78, "r_x3": 50.11, "r_y3": 607.78, "coord_origin": "TOPLEFT" }, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 616.6, "r_x1": 286.36, "r_y1": 616.6, "r_x2": 286.36, "r_y2": 607.69, "r_x3": 70.04, "r_y3": 607.69, "coord_origin": "TOPLEFT" }, "text": ". The input images are resized to 448*448 pixels and", "orig": ". The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 628.55, "r_x1": 286.37, "r_y1": 628.55, "r_x2": 286.37, "r_y2": 619.64, "r_x3": 50.11, "r_y3": 619.64, "coord_origin": "TOPLEFT" }, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 640.51, "r_x1": 207.03, "r_y1": 640.51, "r_x2": 207.03, "r_y2": 631.6, "r_x3": 50.11, "r_y3": 631.6, "coord_origin": "TOPLEFT" }, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:" }, { "label": "formula", "id": 18, "page_no": 5, "cluster": { "id": 18, "label": "formula", "bbox": { "l": 91.66, "t": 653.83, "r": 286.36, "b": 678.4, "coord_origin": "TOPLEFT" }, "confidence": 0.844, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.66, "r_y0": 663.45, "r_x1": 186.02, "r_y1": 663.45, "r_x2": 186.02, "r_y2": 654.55, "r_x3": 91.66, "r_y3": 654.55, "coord_origin": "TOPLEFT" }, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.51, "r_y0": 663.23, "r_x1": 196.26, "r_y1": 663.23, "r_x2": 196.26, "r_y2": 653.83, "r_x3": 188.51, "r_y3": 653.83, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.75, "r_y0": 663.45, "r_x1": 244.81, "r_y1": 663.45, "r_x2": 244.81, "r_y2": 654.55, "r_x3": 198.75, "r_y3": 654.55, "coord_origin": "TOPLEFT" }, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.02, "r_y0": 678.4, "r_x1": 186.25, "r_y1": 678.4, "r_x2": 186.25, "r_y2": 669.49, "r_x3": 101.02, "r_y3": 669.49, "coord_origin": "TOPLEFT" }, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.74, "r_y0": 678.18, "r_x1": 196.48, "r_y1": 678.18, "r_x2": 196.48, "r_y2": 668.77, "r_x3": 188.74, "r_y3": 668.77, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.98, "r_y0": 678.4, "r_x1": 244.81, "r_y1": 678.4, "r_x2": 244.81, "r_y2": 669.49, "r_x3": 198.98, "r_y3": 669.49, "coord_origin": "TOPLEFT" }, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 671.02, "r_x1": 286.36, "r_y1": 671.02, "r_x2": 286.36, "r_y2": 662.12, "r_x3": 274.75, "r_y3": 662.12, "coord_origin": "TOPLEFT" }, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)" }, { "label": "text", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "text", "bbox": { "l": 50.11, "t": 692.29, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved" }, { "label": "text", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 545.12, "r_y1": 84.11, "r_x2": 545.12, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 339.99, "r_y1": 96.07, "r_x2": 339.99, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.89, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 346.89, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 492.96, "r_y1": 108.02, "r_x2": 492.96, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 116.23, "r": 545.12, "b": 328.37, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 125.14, "r_x1": 545.11, "r_y1": 125.14, "r_x2": 545.11, "r_y2": 116.23, "r_x3": 320.82, "r_y3": 116.23, "coord_origin": "TOPLEFT" }, "text": "The Transformer Encoder consists of two \u201cTransformer", "orig": "The Transformer Encoder consists of two \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 137.09, "r_x1": 545.12, "r_y1": 137.09, "r_x2": 545.12, "r_y2": 128.18, "r_x3": 308.86, "r_y3": 128.18, "coord_origin": "TOPLEFT" }, "text": "Encoder Layers\u201d, with an input feature size of 512, feed", "orig": "Encoder Layers\u201d, with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 149.05, "r_x1": 545.12, "r_y1": 149.05, "r_x2": 545.12, "r_y2": 140.14, "r_x3": 308.86, "r_y3": 140.14, "coord_origin": "TOPLEFT" }, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 161.0, "r_x1": 545.12, "r_y1": 161.0, "r_x2": 545.12, "r_y2": 152.09, "r_x3": 308.86, "r_y3": 152.09, "coord_origin": "TOPLEFT" }, "text": "Transformer Decoder it is composed of four \u201cTransformer", "orig": "Transformer Decoder it is composed of four \u201cTransformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 172.96, "r_x1": 545.12, "r_y1": 172.96, "r_x2": 545.12, "r_y2": 164.05, "r_x3": 308.86, "r_y3": 164.05, "coord_origin": "TOPLEFT" }, "text": "Decoder Layers\u201d with similar input and output dimensions", "orig": "Decoder Layers\u201d with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 184.91, "r_x1": 467.22, "r_y1": 184.91, "r_x2": 467.22, "r_y2": 176.01, "r_x3": 308.86, "r_y3": 176.01, "coord_origin": "TOPLEFT" }, "text": "as the \u201cTransformer Encoder Layers\u201d.", "orig": "as the \u201cTransformer Encoder Layers\u201d.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.44, "r_y0": 184.91, "r_x1": 545.12, "r_y1": 184.91, "r_x2": 545.12, "r_y2": 176.01, "r_x3": 475.44, "r_y3": 176.01, "coord_origin": "TOPLEFT" }, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 196.87, "r_x1": 545.12, "r_y1": 196.87, "r_x2": 545.12, "r_y2": 187.96, "r_x3": 308.86, "r_y3": 187.96, "coord_origin": "TOPLEFT" }, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 208.82, "r_x1": 545.12, "r_y1": 208.82, "r_x2": 545.12, "r_y2": 199.92, "r_x3": 308.86, "r_y3": 199.92, "coord_origin": "TOPLEFT" }, "text": "mentation parameters, our extensive experimentation has", "orig": "mentation parameters, our extensive experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 220.78, "r_x1": 545.12, "r_y1": 220.78, "r_x2": 545.12, "r_y2": 211.87, "r_x3": 308.86, "r_y3": 211.87, "coord_origin": "TOPLEFT" }, "text": "proved this setup to be more suitable for table images. We", "orig": "proved this setup to be more suitable for table images. We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 232.73, "r_x1": 545.12, "r_y1": 232.73, "r_x2": 545.12, "r_y2": 223.83, "r_x3": 308.86, "r_y3": 223.83, "coord_origin": "TOPLEFT" }, "text": "attribute this finding to the inherent design of table im-", "orig": "attribute this finding to the inherent design of table im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 244.69, "r_x1": 545.12, "r_y1": 244.69, "r_x2": 545.12, "r_y2": 235.78, "r_x3": 308.86, "r_y3": 235.78, "coord_origin": "TOPLEFT" }, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 256.64, "r_x1": 545.12, "r_y1": 256.64, "r_x2": 545.12, "r_y2": 247.74, "r_x3": 308.86, "r_y3": 247.74, "coord_origin": "TOPLEFT" }, "text": "elaborate content present in other scopes (e.g. the COCO", "orig": "elaborate content present in other scopes (e.g. the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 268.6, "r_x1": 342.34, "r_y1": 268.6, "r_x2": 342.34, "r_y2": 259.69, "r_x3": 308.86, "r_y3": 259.69, "coord_origin": "TOPLEFT" }, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.95, "r_y0": 268.6, "r_x1": 545.12, "r_y1": 268.6, "r_x2": 545.12, "r_y2": 259.69, "r_x3": 348.95, "r_y3": 259.69, "coord_origin": "TOPLEFT" }, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 280.55, "r_x1": 545.12, "r_y1": 280.55, "r_x2": 545.12, "r_y2": 271.65, "r_x3": 308.86, "r_y3": 271.65, "coord_origin": "TOPLEFT" }, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 292.51, "r_x1": 545.12, "r_y1": 292.51, "r_x2": 545.12, "r_y2": 283.6, "r_x3": 308.86, "r_y3": 283.6, "coord_origin": "TOPLEFT" }, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.46, "r_x1": 545.12, "r_y1": 304.46, "r_x2": 545.12, "r_y2": 295.56, "r_x3": 308.86, "r_y3": 295.56, "coord_origin": "TOPLEFT" }, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.42, "r_x1": 545.12, "r_y1": 316.42, "r_x2": 545.12, "r_y2": 307.51, "r_x3": 308.86, "r_y3": 307.51, "coord_origin": "TOPLEFT" }, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 328.37, "r_x1": 532.48, "r_y1": 328.37, "r_x2": 532.48, "r_y2": 319.47, "r_x3": 308.86, "r_y3": 319.47, "coord_origin": "TOPLEFT" }, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The Transformer Encoder consists of two \"Transformer Encoder Layers\", with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four \"Transformer Decoder Layers\" with similar input and output dimensions as the \"Transformer Encoder Layers\". Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5." }, { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 308.86, "t": 336.58, "r": 545.12, "b": 429.17, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 345.48, "r_x1": 545.11, "r_y1": 345.48, "r_x2": 545.11, "r_y2": 336.58, "r_x3": 320.82, "r_y3": 336.58, "coord_origin": "TOPLEFT" }, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 357.44, "r_x1": 403.74, "r_y1": 357.44, "r_x2": 403.74, "r_y2": 348.53, "r_x3": 308.86, "r_y3": 348.53, "coord_origin": "TOPLEFT" }, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.08, "r_y0": 357.21, "r_x1": 503.54, "r_y1": 357.21, "r_x2": 503.54, "r_y2": 348.62, "r_x3": 406.08, "r_y3": 348.62, "coord_origin": "TOPLEFT" }, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 503.54, "r_y0": 357.44, "r_x1": 506.03, "r_y1": 357.44, "r_x2": 506.03, "r_y2": 348.53, "r_x3": 503.54, "r_y3": 348.53, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.4, "r_y0": 357.21, "r_x1": 545.11, "r_y1": 357.21, "r_x2": 545.11, "r_y2": 348.62, "r_x3": 508.4, "r_y3": 348.62, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 369.16, "r_x1": 343.16, "r_y1": 369.16, "r_x2": 343.16, "r_y2": 360.58, "r_x3": 308.86, "r_y3": 360.58, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 343.16, "r_y0": 369.39, "r_x1": 362.2, "r_y1": 369.39, "r_x2": 362.2, "r_y2": 360.49, "r_x3": 343.16, "r_y3": 360.49, "coord_origin": "TOPLEFT" }, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 364.29, "r_y0": 369.16, "r_x1": 440.94, "r_y1": 369.16, "r_x2": 440.94, "r_y2": 360.58, "r_x3": 364.29, "r_y3": 360.58, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.94, "r_y0": 369.39, "r_x1": 545.11, "r_y1": 369.39, "r_x2": 545.11, "r_y2": 360.49, "r_x3": 440.94, "r_y3": 360.49, "coord_origin": "TOPLEFT" }, "text": ". Taking the PubTabNet as", "orig": ". Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 381.35, "r_x1": 545.12, "r_y1": 381.35, "r_x2": 545.12, "r_y2": 372.44, "r_x3": 308.86, "r_y3": 372.44, "coord_origin": "TOPLEFT" }, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 393.31, "r_x1": 545.12, "r_y1": 393.31, "r_x2": 545.12, "r_y2": 384.4, "r_x3": 308.86, "r_y3": 384.4, "coord_origin": "TOPLEFT" }, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 405.04, "r_x1": 314.67, "r_y1": 405.04, "r_x2": 314.67, "r_y2": 396.19, "r_x3": 308.86, "r_y3": 396.19, "coord_origin": "TOPLEFT" }, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.66, "r_y0": 405.26, "r_x1": 360.39, "r_y1": 405.26, "r_x2": 360.39, "r_y2": 396.35, "r_x3": 318.66, "r_y3": 396.35, "coord_origin": "TOPLEFT" }, "text": "set to 0.5.", "orig": "set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.96, "r_y0": 405.26, "r_x1": 545.11, "r_y1": 405.26, "r_x2": 545.11, "r_y2": 396.35, "r_x3": 367.96, "r_y3": 396.35, "coord_origin": "TOPLEFT" }, "text": "Afterwards, we reduce the learning rate to", "orig": "Afterwards, we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 417.21, "r_x1": 545.12, "r_y1": 417.21, "r_x2": 545.12, "r_y2": 408.31, "r_x3": 308.86, "r_y3": 408.31, "coord_origin": "TOPLEFT" }, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 429.17, "r_x1": 360.97, "r_y1": 429.17, "r_x2": 360.97, "r_y2": 420.26, "r_x3": 308.86, "r_y3": 420.26, "coord_origin": "TOPLEFT" }, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network , Structure Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence." }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 437.37, "r": 545.12, "b": 553.88, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 446.28, "r_x1": 545.11, "r_y1": 446.28, "r_x2": 545.11, "r_y2": 437.37, "r_x3": 320.82, "r_y3": 437.37, "coord_origin": "TOPLEFT" }, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 458.24, "r_x1": 384.63, "r_y1": 458.24, "r_x2": 384.63, "r_y2": 449.33, "r_x3": 308.86, "r_y3": 449.33, "coord_origin": "TOPLEFT" }, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 458.24, "r_x1": 545.12, "r_y1": 458.24, "r_x2": 545.12, "r_y2": 449.33, "r_x3": 391.37, "r_y3": 449.33, "coord_origin": "TOPLEFT" }, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 470.19, "r_x1": 494.01, "r_y1": 470.19, "r_x2": 494.01, "r_y2": 461.28, "r_x3": 308.86, "r_y3": 461.28, "coord_origin": "TOPLEFT" }, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.08, "r_y0": 469.96, "r_x1": 545.11, "r_y1": 469.96, "r_x2": 545.11, "r_y2": 461.37, "r_x3": 498.08, "r_y3": 461.37, "coord_origin": "TOPLEFT" }, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 481.92, "r_x1": 364.44, "r_y1": 481.92, "r_x2": 364.44, "r_y2": 473.33, "r_x3": 308.86, "r_y3": 473.33, "coord_origin": "TOPLEFT" }, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06, "r_y0": 482.15, "r_x1": 545.11, "r_y1": 482.15, "r_x2": 545.11, "r_y2": 473.24, "r_x3": 367.06, "r_y3": 473.24, "coord_origin": "TOPLEFT" }, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 494.1, "r_x1": 545.12, "r_y1": 494.1, "r_x2": 545.12, "r_y2": 485.19, "r_x3": 308.86, "r_y3": 485.19, "coord_origin": "TOPLEFT" }, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 506.06, "r_x1": 545.12, "r_y1": 506.06, "r_x2": 545.12, "r_y2": 497.15, "r_x3": 308.86, "r_y3": 497.15, "coord_origin": "TOPLEFT" }, "text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 518.01, "r_x1": 545.12, "r_y1": 518.01, "r_x2": 545.12, "r_y2": 509.11, "r_x3": 308.86, "r_y3": 509.11, "coord_origin": "TOPLEFT" }, "text": "faster autoregressive decoding. This is achieved by storing", "orig": "faster autoregressive decoding. This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 529.97, "r_x1": 545.12, "r_y1": 529.97, "r_x2": 545.12, "r_y2": 521.06, "r_x3": 308.86, "r_y3": 521.06, "coord_origin": "TOPLEFT" }, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 541.92, "r_x1": 545.12, "r_y1": 541.92, "r_x2": 545.12, "r_y2": 533.02, "r_x3": 308.86, "r_y3": 533.02, "coord_origin": "TOPLEFT" }, "text": "each time step. Therefore, we only compute the attention", "orig": "each time step. Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 553.88, "r_x1": 377.22, "r_y1": 553.88, "r_x2": 377.22, "r_y2": 544.97, "r_x3": 308.86, "r_y3": 544.97, "coord_origin": "TOPLEFT" }, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag." }, { "label": "section_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 308.86, "t": 579.55, "r": 397.44, "b": 589.41, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 589.41, "r_x1": 323.9, "r_y1": 589.41, "r_x2": 323.9, "r_y2": 579.55, "r_x3": 308.86, "r_y3": 579.55, "coord_origin": "TOPLEFT" }, "text": "5.2.", "orig": "5.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.93, "r_y0": 589.41, "r_x1": 397.44, "r_y1": 589.41, "r_x2": 397.44, "r_y2": 579.55, "r_x3": 333.93, "r_y3": 579.55, "coord_origin": "TOPLEFT" }, "text": "Generalization", "orig": "Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2. Generalization" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 308.86, "t": 603.45, "r": 545.12, "b": 672.13, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 612.36, "r_x1": 545.11, "r_y1": 612.36, "r_x2": 545.11, "r_y2": 603.45, "r_x3": 320.82, "r_y3": 603.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 624.31, "r_x1": 545.12, "r_y1": 624.31, "r_x2": 545.12, "r_y2": 615.4, "r_x3": 308.86, "r_y3": 615.4, "coord_origin": "TOPLEFT" }, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 636.27, "r_x1": 545.12, "r_y1": 636.27, "r_x2": 545.12, "r_y2": 627.36, "r_x3": 308.86, "r_y3": 627.36, "coord_origin": "TOPLEFT" }, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 648.22, "r_x1": 545.12, "r_y1": 648.22, "r_x2": 545.12, "r_y2": 639.31, "r_x3": 308.86, "r_y3": 639.31, "coord_origin": "TOPLEFT" }, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 660.18, "r_x1": 545.12, "r_y1": 660.18, "r_x2": 545.12, "r_y2": 651.27, "r_x3": 308.86, "r_y3": 651.27, "coord_origin": "TOPLEFT" }, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 672.13, "r_x1": 350.7, "r_y1": 672.13, "r_x2": 350.7, "r_y2": 663.23, "r_x3": 308.86, "r_y3": 663.23, "coord_origin": "TOPLEFT" }, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively." }, { "label": "text", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "text", "bbox": { "l": 308.86, "t": 680.34, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 689.24, "r_x1": 545.12, "r_y1": 689.24, "r_x2": 545.12, "r_y2": 680.34, "r_x3": 320.82, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 701.2, "r_x1": 396.21, "r_y1": 701.2, "r_x2": 396.21, "r_y2": 692.29, "r_x3": 308.86, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet dataset.", "orig": "SynthTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.41, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 406.41, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Throughout our experiments, the", "orig": "Throughout our experiments, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 495.94, "r_y1": 713.15, "r_x2": 495.94, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized." } ], "headers": [ { "label": "page_footer", "id": 17, "page_no": 5, "cluster": { "id": 17, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" } ] } }, { "page_no": 6, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.25, "r_x1": 63.7, "r_y1": 84.25, "r_x2": 63.7, "r_y2": 74.4, "r_x3": 50.11, "r_y3": 74.4, "coord_origin": "TOPLEFT" }, "text": "5.3.", "orig": "5.3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.77, "r_y0": 84.25, "r_x1": 167.9, "r_y1": 84.25, "r_x2": 167.9, "r_y2": 74.4, "r_x3": 72.77, "r_y3": 74.4, "coord_origin": "TOPLEFT" }, "text": "Datasets and Metrics", "orig": "Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 102.26, "r_x1": 286.36, "r_y1": 102.26, "r_x2": 286.36, "r_y2": 93.35, "r_x3": 62.07, "r_y3": 93.35, "coord_origin": "TOPLEFT" }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 114.21, "r_x1": 286.37, "r_y1": 114.21, "r_x2": 286.37, "r_y2": 105.31, "r_x3": 50.11, "r_y3": 105.31, "coord_origin": "TOPLEFT" }, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 126.17, "r_x1": 286.37, "r_y1": 126.17, "r_x2": 286.37, "r_y2": 117.26, "r_x3": 50.11, "r_y3": 117.26, "coord_origin": "TOPLEFT" }, "text": "ground-truth as a tree structure of HTML tags. This simi-", "orig": "ground-truth as a tree structure of HTML tags. This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 138.12, "r_x1": 136.72, "r_y1": 138.12, "r_x2": 136.72, "r_y2": 129.22, "r_x3": 50.11, "r_y3": 129.22, "coord_origin": "TOPLEFT" }, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.22, "r_y0": 165.9, "r_x1": 118.88, "r_y1": 165.9, "r_x2": 118.88, "r_y2": 157.06, "r_x3": 86.22, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": "TEDS (", "orig": "TEDS (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.87, "r_y0": 165.9, "r_x1": 143.27, "r_y1": 165.9, "r_x2": 143.27, "r_y2": 157.06, "r_x3": 118.87, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.77, "r_y0": 165.9, "r_x1": 165.9, "r_y1": 165.9, "r_x2": 165.9, "r_y2": 157.06, "r_x3": 143.77, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.12, "r_y0": 165.9, "r_x1": 175.87, "r_y1": 165.9, "r_x2": 175.87, "r_y2": 156.5, "r_x3": 168.12, "r_y3": 156.5, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.28, "r_y0": 159.16, "r_x1": 221.96, "r_y1": 159.16, "r_x2": 221.96, "r_y2": 150.32, "r_x3": 179.28, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.95, "r_y0": 159.16, "r_x1": 246.35, "r_y1": 159.16, "r_x2": 246.35, "r_y2": 150.32, "r_x3": 221.95, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.84, "r_y0": 159.16, "r_x1": 250.72, "r_y1": 159.16, "r_x2": 250.72, "r_y2": 150.32, "r_x3": 246.84, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.21, "r_y0": 172.74, "r_x1": 206.29, "r_y1": 172.74, "r_x2": 206.29, "r_y2": 163.89, "r_x3": 182.21, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "max (", "orig": "max (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.29, "r_y0": 172.74, "r_x1": 209.06, "r_y1": 172.74, "r_x2": 209.06, "r_y2": 163.33, "r_x3": 206.29, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.06, "r_y0": 172.74, "r_x1": 219.2, "r_y1": 172.74, "r_x2": 219.2, "r_y2": 163.89, "r_x3": 209.06, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.7, "r_y0": 172.74, "r_x1": 222.46, "r_y1": 172.74, "r_x2": 222.46, "r_y2": 163.33, "r_x3": 219.7, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.12, "r_y0": 172.74, "r_x1": 226.89, "r_y1": 172.74, "r_x2": 226.89, "r_y2": 163.89, "r_x3": 224.12, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.55, "r_y0": 172.74, "r_x1": 231.32, "r_y1": 172.74, "r_x2": 231.32, "r_y2": 163.33, "r_x3": 228.55, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.32, "r_y0": 172.74, "r_x1": 240.65, "r_y1": 172.74, "r_x2": 240.65, "r_y2": 163.89, "r_x3": 231.32, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.14, "r_y0": 172.74, "r_x1": 243.91, "r_y1": 172.74, "r_x2": 243.91, "r_y2": 163.33, "r_x3": 241.14, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.91, "r_y0": 172.74, "r_x1": 247.79, "r_y1": 172.74, "r_x2": 247.79, "r_y2": 163.89, "r_x3": 243.91, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 166.12, "r_x1": 286.36, "r_y1": 166.12, "r_x2": 286.36, "r_y2": 157.22, "r_x3": 274.75, "r_y3": 157.22, "coord_origin": "TOPLEFT" }, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 190.07, "r_x1": 86.41, "r_y1": 190.07, "r_x2": 86.41, "r_y2": 181.16, "r_x3": 62.07, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.58, "r_y0": 189.85, "r_x1": 98.72, "r_y1": 189.85, "r_x2": 98.72, "r_y2": 181.0, "r_x3": 88.58, "r_y3": 181.0, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.4, "r_y0": 190.07, "r_x1": 115.78, "r_y1": 190.07, "r_x2": 115.78, "r_y2": 181.16, "r_x3": 101.4, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.96, "r_y0": 189.85, "r_x1": 127.29, "r_y1": 189.85, "r_x2": 127.29, "r_y2": 181.0, "r_x3": 117.96, "r_y3": 181.0, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.96, "r_y0": 190.07, "r_x1": 286.36, "r_y1": 190.07, "r_x2": 286.36, "r_y2": 181.16, "r_x3": 129.96, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 202.02, "r_x1": 252.78, "r_y1": 202.02, "r_x2": 252.78, "r_y2": 193.12, "r_x3": 50.11, "r_y3": 193.12, "coord_origin": "TOPLEFT" }, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.18, "r_y0": 201.8, "r_x1": 257.95, "r_y1": 201.8, "r_x2": 257.95, "r_y2": 192.4, "r_x3": 255.18, "r_y3": 192.4, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.95, "r_y0": 201.8, "r_x1": 263.77, "r_y1": 201.8, "r_x2": 263.77, "r_y2": 192.96, "r_x3": 257.95, "r_y3": 192.96, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.15, "r_y0": 201.8, "r_x1": 267.92, "r_y1": 201.8, "r_x2": 267.92, "r_y2": 192.4, "r_x3": 265.15, "r_y3": 192.4, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.32, "r_y0": 202.02, "r_x1": 286.36, "r_y1": 202.02, "r_x2": 286.36, "r_y2": 193.12, "r_x3": 270.32, "r_y3": 193.12, "coord_origin": "TOPLEFT" }, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 213.98, "r_x1": 172.13, "r_y1": 213.98, "r_x2": 172.13, "r_y2": 205.07, "r_x3": 50.11, "r_y3": 205.07, "coord_origin": "TOPLEFT" }, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.62, "r_y0": 213.76, "r_x1": 180.45, "r_y1": 213.76, "r_x2": 180.45, "r_y2": 204.91, "r_x3": 174.62, "r_y3": 204.91, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.83, "r_y0": 213.98, "r_x1": 184.32, "r_y1": 213.98, "r_x2": 184.32, "r_y2": 205.07, "r_x3": 181.83, "r_y3": 205.07, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 234.67, "r_x1": 64.55, "r_y1": 234.67, "r_x2": 64.55, "r_y2": 224.82, "r_x3": 50.11, "r_y3": 224.82, "coord_origin": "TOPLEFT" }, "text": "5.4.", "orig": "5.4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.18, "r_y0": 234.67, "r_x1": 170.45, "r_y1": 234.67, "r_x2": 170.45, "r_y2": 224.82, "r_x3": 74.18, "r_y3": 224.82, "coord_origin": "TOPLEFT" }, "text": "Quantitative Analysis", "orig": "Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 252.61, "r_x1": 105.32, "r_y1": 252.61, "r_x2": 105.32, "r_y2": 243.65, "r_x3": 62.07, "r_y3": 243.65, "coord_origin": "TOPLEFT" }, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.13, "r_y0": 252.68, "r_x1": 184.68, "r_y1": 252.68, "r_x2": 184.68, "r_y2": 243.77, "r_x3": 112.13, "r_y3": 243.77, "coord_origin": "TOPLEFT" }, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 191.48, "r_y0": 252.68, "r_x1": 286.36, "r_y1": 252.68, "r_x2": 286.36, "r_y2": 243.77, "r_x3": 191.48, "r_y3": 243.77, "coord_origin": "TOPLEFT" }, "text": "2, TableFormer outper-", "orig": "2, TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.63, "r_x1": 286.37, "r_y1": 264.63, "r_x2": 286.37, "r_y2": 255.72, "r_x3": 50.11, "r_y3": 255.72, "coord_origin": "TOPLEFT" }, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.59, "r_x1": 286.37, "r_y1": 276.59, "r_x2": 286.37, "r_y2": 267.68, "r_x3": 50.11, "r_y3": 267.68, "coord_origin": "TOPLEFT" }, "text": "margin for predicting the table structure from an image.", "orig": "margin for predicting the table structure from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.54, "r_x1": 286.37, "r_y1": 288.54, "r_x2": 286.37, "r_y2": 279.63, "r_x3": 50.11, "r_y3": 279.63, "coord_origin": "TOPLEFT" }, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.5, "r_x1": 286.37, "r_y1": 300.5, "r_x2": 286.37, "r_y2": 291.59, "r_x3": 50.11, "r_y3": 291.59, "coord_origin": "TOPLEFT" }, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.45, "r_x1": 286.37, "r_y1": 312.45, "r_x2": 286.37, "r_y2": 303.55, "r_x3": 50.11, "r_y3": 303.55, "coord_origin": "TOPLEFT" }, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.41, "r_x1": 286.37, "r_y1": 324.41, "r_x2": 286.37, "r_y2": 315.5, "r_x3": 50.11, "r_y3": 315.5, "coord_origin": "TOPLEFT" }, "text": "dataset. It has been observed that large tables (e.g. tables", "orig": "dataset. It has been observed that large tables (e.g. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.36, "r_x1": 286.37, "r_y1": 336.36, "r_x2": 286.37, "r_y2": 327.46, "r_x3": 50.11, "r_y3": 327.46, "coord_origin": "TOPLEFT" }, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.32, "r_x1": 286.37, "r_y1": 348.32, "r_x2": 286.37, "r_y2": 339.41, "r_x3": 50.11, "r_y3": 339.41, "coord_origin": "TOPLEFT" }, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 360.27, "r_x1": 286.37, "r_y1": 360.27, "r_x2": 286.37, "r_y2": 351.37, "r_x3": 50.11, "r_y3": 351.37, "coord_origin": "TOPLEFT" }, "text": "processing step, that produces downsampled images with", "orig": "processing step, that produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 372.23, "r_x1": 286.37, "r_y1": 372.23, "r_x2": 286.37, "r_y2": 363.32, "r_x3": 50.11, "r_y3": 363.32, "coord_origin": "TOPLEFT" }, "text": "indistinguishable features. This problem can be addressed", "orig": "indistinguishable features. This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 384.18, "r_x1": 286.37, "r_y1": 384.18, "r_x2": 286.37, "r_y2": 375.28, "r_x3": 50.11, "r_y3": 375.28, "coord_origin": "TOPLEFT" }, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.14, "r_x1": 170.01, "r_y1": 396.14, "r_x2": 170.01, "r_y2": 387.23, "r_x3": 50.11, "r_y3": 387.23, "coord_origin": "TOPLEFT" }, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 601.34, "r_x1": 286.37, "r_y1": 601.34, "r_x2": 286.37, "r_y2": 592.43, "r_x3": 50.11, "r_y3": 592.43, "coord_origin": "TOPLEFT" }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 613.29, "r_x1": 247.46, "r_y1": 613.29, "r_x2": 247.46, "r_y2": 604.39, "r_x3": 50.11, "r_y3": 604.39, "coord_origin": "TOPLEFT" }, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 625.25, "r_x1": 261.79, "r_y1": 625.25, "r_x2": 261.79, "r_y2": 616.34, "r_x3": 50.11, "r_y3": 616.34, "coord_origin": "TOPLEFT" }, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 653.31, "r_x1": 124.72, "r_y1": 653.31, "r_x2": 124.72, "r_y2": 644.35, "r_x3": 62.07, "r_y3": 644.35, "coord_origin": "TOPLEFT" }, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.2, "r_y0": 653.38, "r_x1": 242.93, "r_y1": 653.38, "r_x2": 242.93, "r_y2": 644.47, "r_x3": 128.2, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.55, "r_y0": 653.15, "r_x1": 286.36, "r_y1": 653.15, "r_x2": 286.36, "r_y2": 644.56, "r_x3": 245.55, "r_y3": 644.56, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.1, "r_x1": 84.97, "r_y1": 665.1, "r_x2": 84.97, "r_y2": 656.51, "r_x3": 50.11, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.52, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 89.52, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "provides bounding boxes that can be improved", "orig": "provides bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "grid-like structure of tables to refine the predictions. A de-", "orig": "grid-like structure of tables to refine the predictions. A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "supplementary material. As shown in Tab. 3, we evaluate", "orig": "supplementary material. As shown in Tab. 3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 322.14, "r_y1": 84.11, "r_x2": 322.14, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.45, "r_y0": 83.89, "r_x1": 404.57, "r_y1": 83.89, "r_x2": 404.57, "r_y2": 75.3, "r_x3": 325.45, "r_y3": 75.3, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.1, "r_y0": 84.11, "r_x1": 545.11, "r_y1": 84.11, "r_x2": 545.11, "r_y2": 75.21, "r_x3": 408.1, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 470.23, "r_y1": 108.02, "r_x2": 470.23, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "for pre-processing and post-processing.", "orig": "for pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.53, "r_y0": 108.02, "r_x1": 545.12, "r_y1": 108.02, "r_x2": 545.12, "r_y2": 99.12, "r_x3": 477.53, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 119.98, "r_x1": 545.12, "r_y1": 119.98, "r_x2": 545.12, "r_y2": 111.07, "r_x3": 308.86, "r_y3": 111.07, "coord_origin": "TOPLEFT" }, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 131.93, "r_x1": 545.12, "r_y1": 131.93, "r_x2": 545.12, "r_y2": 123.03, "r_x3": 308.86, "r_y3": 123.03, "coord_origin": "TOPLEFT" }, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 143.89, "r_x1": 502.02, "r_y1": 143.89, "r_x2": 502.02, "r_y2": 134.98, "r_x3": 308.86, "r_y3": 134.98, "coord_origin": "TOPLEFT" }, "text": "posed approach, we\u2019ve integrated TableFormer\u2019s", "orig": "posed approach, we\u2019ve integrated TableFormer\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 504.47, "r_y0": 143.66, "r_x1": 545.11, "r_y1": 143.66, "r_x2": 545.11, "r_y2": 135.07, "r_x3": 504.47, "r_y3": 135.07, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 155.62, "r_x1": 343.16, "r_y1": 155.62, "r_x2": 343.16, "r_y2": 147.03, "r_x3": 308.86, "r_y3": 147.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.37, "r_y0": 155.85, "r_x1": 545.11, "r_y1": 155.85, "r_x2": 545.11, "r_y2": 146.94, "r_x3": 346.37, "r_y3": 146.94, "coord_origin": "TOPLEFT" }, "text": "into EDD architecture. As mentioned previously,", "orig": "into EDD architecture. As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 167.8, "r_x1": 446.16, "r_y1": 167.8, "r_x2": 446.16, "r_y2": 158.89, "r_x3": 308.86, "r_y3": 158.89, "coord_origin": "TOPLEFT" }, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.29, "r_y0": 167.57, "r_x1": 525.04, "r_y1": 167.57, "r_x2": 525.04, "r_y2": 158.98, "r_x3": 448.29, "r_y3": 158.98, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.4, "r_y0": 167.8, "r_x1": 545.11, "r_y1": 167.8, "r_x2": 545.11, "r_y2": 158.89, "r_x3": 527.4, "r_y3": 158.89, "coord_origin": "TOPLEFT" }, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 179.76, "r_x1": 545.12, "r_y1": 179.76, "r_x2": 545.12, "r_y2": 170.85, "r_x3": 308.86, "r_y3": 170.85, "coord_origin": "TOPLEFT" }, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 191.71, "r_x1": 432.87, "r_y1": 191.71, "r_x2": 432.87, "r_y2": 182.8, "r_x3": 308.86, "r_y3": 182.8, "coord_origin": "TOPLEFT" }, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.39, "r_y0": 191.48, "r_x1": 510.93, "r_y1": 191.48, "r_x2": 510.93, "r_y2": 182.89, "r_x3": 436.39, "r_y3": 182.89, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.68, "r_y0": 191.71, "r_x1": 545.11, "r_y1": 191.71, "r_x2": 545.11, "r_y2": 182.8, "r_x3": 514.68, "r_y3": 182.8, "coord_origin": "TOPLEFT" }, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 203.67, "r_x1": 431.17, "r_y1": 203.67, "r_x2": 431.17, "r_y2": 194.76, "r_x3": 308.86, "r_y3": 194.76, "coord_origin": "TOPLEFT" }, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.68, "r_y0": 203.44, "r_x1": 514.18, "r_y1": 203.44, "r_x2": 514.18, "r_y2": 194.85, "r_x3": 434.68, "r_y3": 194.85, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.18, "r_y0": 203.67, "r_x1": 545.11, "r_y1": 203.67, "r_x2": 545.11, "r_y2": 194.76, "r_x3": 514.18, "r_y3": 194.76, "coord_origin": "TOPLEFT" }, "text": ". If the", "orig": ". If the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 215.39, "r_x1": 382.36, "r_y1": 215.39, "r_x2": 382.36, "r_y2": 206.81, "r_x3": 308.86, "r_y3": 206.81, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.08, "r_y0": 215.62, "r_x1": 545.11, "r_y1": 215.62, "r_x2": 545.11, "r_y2": 206.72, "r_x3": 385.08, "r_y3": 206.72, "coord_origin": "TOPLEFT" }, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 227.58, "r_x1": 501.7, "r_y1": 227.58, "r_x2": 501.7, "r_y2": 218.67, "r_x3": 308.86, "r_y3": 218.67, "coord_origin": "TOPLEFT" }, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 325.36, "r_x1": 341.5, "r_y1": 325.36, "r_x2": 341.5, "r_y2": 316.45, "r_x3": 308.86, "r_y3": 316.45, "coord_origin": "TOPLEFT" }, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.6, "r_y0": 325.36, "r_x1": 545.12, "r_y1": 325.36, "r_x2": 545.12, "r_y2": 316.45, "r_x3": 348.6, "r_y3": 316.45, "coord_origin": "TOPLEFT" }, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 337.31, "r_x1": 474.98, "r_y1": 337.31, "r_x2": 474.98, "r_y2": 328.4, "r_x3": 308.86, "r_y3": 328.4, "coord_origin": "TOPLEFT" }, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 376.64, "r_x1": 378.95, "r_y1": 376.64, "r_x2": 378.95, "r_y2": 367.68, "r_x3": 320.82, "r_y3": 367.68, "coord_origin": "TOPLEFT" }, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.08, "r_y0": 376.71, "r_x1": 545.12, "r_y1": 376.71, "r_x2": 545.12, "r_y2": 367.8, "r_x3": 387.08, "r_y3": 367.8, "coord_origin": "TOPLEFT" }, "text": "In this section, we evaluate the entire", "orig": "In this section, we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 388.66, "r_x1": 487.19, "r_y1": 388.66, "r_x2": 487.19, "r_y2": 379.75, "r_x3": 308.86, "r_y3": 379.75, "coord_origin": "TOPLEFT" }, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.97, "r_y0": 388.66, "r_x1": 545.12, "r_y1": 388.66, "r_x2": 545.12, "r_y2": 379.75, "r_x3": 493.97, "r_y3": 379.75, "coord_origin": "TOPLEFT" }, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.62, "r_x1": 545.12, "r_y1": 400.62, "r_x2": 545.12, "r_y2": 391.71, "r_x3": 308.86, "r_y3": 391.71, "coord_origin": "TOPLEFT" }, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.57, "r_x1": 545.12, "r_y1": 412.57, "r_x2": 545.12, "r_y2": 403.67, "r_x3": 308.86, "r_y3": 403.67, "coord_origin": "TOPLEFT" }, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.53, "r_x1": 314.08, "r_y1": 424.53, "r_x2": 314.08, "r_y2": 415.62, "r_x3": 308.86, "r_y3": 415.62, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.69, "r_y0": 424.53, "r_x1": 545.12, "r_y1": 424.53, "r_x2": 545.12, "r_y2": 415.62, "r_x3": 316.69, "r_y3": 415.62, "coord_origin": "TOPLEFT" }, "text": "shows the TEDs score of HTML code representing the", "orig": "shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.48, "r_x1": 545.12, "r_y1": 436.48, "r_x2": 545.12, "r_y2": 427.58, "r_x3": 308.86, "r_y3": 427.58, "coord_origin": "TOPLEFT" }, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.44, "r_x1": 545.12, "r_y1": 448.44, "r_x2": 545.12, "r_y2": 439.53, "r_x3": 308.86, "r_y3": 439.53, "coord_origin": "TOPLEFT" }, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 460.39, "r_x1": 350.24, "r_y1": 460.39, "r_x2": 350.24, "r_y2": 451.49, "r_x3": 308.86, "r_y3": 451.49, "coord_origin": "TOPLEFT" }, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.18, "r_y0": 460.32, "r_x1": 374.59, "r_y1": 460.32, "r_x2": 374.59, "r_y2": 451.37, "r_x3": 352.18, "r_y3": 451.37, "coord_origin": "TOPLEFT" }, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.53, "r_y0": 460.39, "r_x1": 545.11, "r_y1": 460.39, "r_x2": 545.11, "r_y2": 451.49, "r_x3": 376.53, "r_y3": 451.49, "coord_origin": "TOPLEFT" }, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 472.35, "r_x1": 545.12, "r_y1": 472.35, "r_x2": 545.12, "r_y2": 463.44, "r_x3": 308.86, "r_y3": 463.44, "coord_origin": "TOPLEFT" }, "text": "mercial solutions. We believe our scores would be higher", "orig": "mercial solutions. We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 484.3, "r_x1": 545.12, "r_y1": 484.3, "r_x2": 545.12, "r_y2": 475.4, "r_x3": 308.86, "r_y3": 475.4, "coord_origin": "TOPLEFT" }, "text": "if the HTML ground-truth matched the extracted PDF cell", "orig": "if the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 496.26, "r_x1": 545.12, "r_y1": 496.26, "r_x2": 545.12, "r_y2": 487.35, "r_x3": 308.86, "r_y3": 487.35, "coord_origin": "TOPLEFT" }, "text": "content. Unfortunately, there are small discrepancies such", "orig": "content. Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 508.21, "r_x1": 545.12, "r_y1": 508.21, "r_x2": 545.12, "r_y2": 499.31, "r_x3": 308.86, "r_y3": 499.31, "coord_origin": "TOPLEFT" }, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 520.17, "r_x1": 405.7, "r_y1": 520.17, "r_x2": 405.7, "r_y2": 511.26, "r_x3": 308.86, "r_y3": 511.26, "coord_origin": "TOPLEFT" }, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.77, "r_x1": 341.74, "r_y1": 665.77, "r_x2": 341.74, "r_y2": 656.86, "r_x3": 308.86, "r_y3": 656.86, "coord_origin": "TOPLEFT" }, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 349.56, "r_y0": 665.77, "r_x1": 545.12, "r_y1": 665.77, "r_x2": 545.12, "r_y2": 656.86, "r_x3": 349.56, "r_y3": 656.86, "coord_origin": "TOPLEFT" }, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.72, "r_x1": 545.12, "r_y1": 677.72, "r_x2": 545.12, "r_y2": 668.82, "r_x3": 308.86, "r_y3": 668.82, "coord_origin": "TOPLEFT" }, "text": "cell detection on PubTabNet. In all cases the input is PDF", "orig": "cell detection on PubTabNet. In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.68, "r_x1": 435.04, "r_y1": 689.68, "r_x2": 435.04, "r_y2": 680.77, "r_x3": 308.86, "r_y3": 680.77, "coord_origin": "TOPLEFT" }, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "section_header", "bbox": { "l": 50.11, "t": 74.4, "r": 167.9, "b": 84.25, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.25, "r_x1": 63.7, "r_y1": 84.25, "r_x2": 63.7, "r_y2": 74.4, "r_x3": 50.11, "r_y3": 74.4, "coord_origin": "TOPLEFT" }, "text": "5.3.", "orig": "5.3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.77, "r_y0": 84.25, "r_x1": 167.9, "r_y1": 84.25, "r_x2": 167.9, "r_y2": 74.4, "r_x3": 72.77, "r_y3": 74.4, "coord_origin": "TOPLEFT" }, "text": "Datasets and Metrics", "orig": "Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 93.35, "r": 286.37, "b": 138.12, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 102.26, "r_x1": 286.36, "r_y1": 102.26, "r_x2": 286.36, "r_y2": 93.35, "r_x3": 62.07, "r_y3": 93.35, "coord_origin": "TOPLEFT" }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 114.21, "r_x1": 286.37, "r_y1": 114.21, "r_x2": 286.37, "r_y2": 105.31, "r_x3": 50.11, "r_y3": 105.31, "coord_origin": "TOPLEFT" }, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 126.17, "r_x1": 286.37, "r_y1": 126.17, "r_x2": 286.37, "r_y2": 117.26, "r_x3": 50.11, "r_y3": 117.26, "coord_origin": "TOPLEFT" }, "text": "ground-truth as a tree structure of HTML tags. This simi-", "orig": "ground-truth as a tree structure of HTML tags. This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 138.12, "r_x1": 136.72, "r_y1": 138.12, "r_x2": 136.72, "r_y2": 129.22, "r_x3": 50.11, "r_y3": 129.22, "coord_origin": "TOPLEFT" }, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "formula", "bbox": { "l": 86.22, "t": 150.32, "r": 286.36, "b": 172.74, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.22, "r_y0": 165.9, "r_x1": 118.88, "r_y1": 165.9, "r_x2": 118.88, "r_y2": 157.06, "r_x3": 86.22, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": "TEDS (", "orig": "TEDS (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.87, "r_y0": 165.9, "r_x1": 143.27, "r_y1": 165.9, "r_x2": 143.27, "r_y2": 157.06, "r_x3": 118.87, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.77, "r_y0": 165.9, "r_x1": 165.9, "r_y1": 165.9, "r_x2": 165.9, "r_y2": 157.06, "r_x3": 143.77, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.12, "r_y0": 165.9, "r_x1": 175.87, "r_y1": 165.9, "r_x2": 175.87, "r_y2": 156.5, "r_x3": 168.12, "r_y3": 156.5, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.28, "r_y0": 159.16, "r_x1": 221.96, "r_y1": 159.16, "r_x2": 221.96, "r_y2": 150.32, "r_x3": 179.28, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.95, "r_y0": 159.16, "r_x1": 246.35, "r_y1": 159.16, "r_x2": 246.35, "r_y2": 150.32, "r_x3": 221.95, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.84, "r_y0": 159.16, "r_x1": 250.72, "r_y1": 159.16, "r_x2": 250.72, "r_y2": 150.32, "r_x3": 246.84, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.21, "r_y0": 172.74, "r_x1": 206.29, "r_y1": 172.74, "r_x2": 206.29, "r_y2": 163.89, "r_x3": 182.21, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "max (", "orig": "max (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.29, "r_y0": 172.74, "r_x1": 209.06, "r_y1": 172.74, "r_x2": 209.06, "r_y2": 163.33, "r_x3": 206.29, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.06, "r_y0": 172.74, "r_x1": 219.2, "r_y1": 172.74, "r_x2": 219.2, "r_y2": 163.89, "r_x3": 209.06, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.7, "r_y0": 172.74, "r_x1": 222.46, "r_y1": 172.74, "r_x2": 222.46, "r_y2": 163.33, "r_x3": 219.7, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.12, "r_y0": 172.74, "r_x1": 226.89, "r_y1": 172.74, "r_x2": 226.89, "r_y2": 163.89, "r_x3": 224.12, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.55, "r_y0": 172.74, "r_x1": 231.32, "r_y1": 172.74, "r_x2": 231.32, "r_y2": 163.33, "r_x3": 228.55, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.32, "r_y0": 172.74, "r_x1": 240.65, "r_y1": 172.74, "r_x2": 240.65, "r_y2": 163.89, "r_x3": 231.32, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.14, "r_y0": 172.74, "r_x1": 243.91, "r_y1": 172.74, "r_x2": 243.91, "r_y2": 163.33, "r_x3": 241.14, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.91, "r_y0": 172.74, "r_x1": 247.79, "r_y1": 172.74, "r_x2": 247.79, "r_y2": 163.89, "r_x3": 243.91, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 166.12, "r_x1": 286.36, "r_y1": 166.12, "r_x2": 286.36, "r_y2": 157.22, "r_x3": 274.75, "r_y3": 157.22, "coord_origin": "TOPLEFT" }, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 50.11, "t": 181.0, "r": 286.36, "b": 213.98, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 190.07, "r_x1": 86.41, "r_y1": 190.07, "r_x2": 86.41, "r_y2": 181.16, "r_x3": 62.07, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.58, "r_y0": 189.85, "r_x1": 98.72, "r_y1": 189.85, "r_x2": 98.72, "r_y2": 181.0, "r_x3": 88.58, "r_y3": 181.0, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.4, "r_y0": 190.07, "r_x1": 115.78, "r_y1": 190.07, "r_x2": 115.78, "r_y2": 181.16, "r_x3": 101.4, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.96, "r_y0": 189.85, "r_x1": 127.29, "r_y1": 189.85, "r_x2": 127.29, "r_y2": 181.0, "r_x3": 117.96, "r_y3": 181.0, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.96, "r_y0": 190.07, "r_x1": 286.36, "r_y1": 190.07, "r_x2": 286.36, "r_y2": 181.16, "r_x3": 129.96, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 202.02, "r_x1": 252.78, "r_y1": 202.02, "r_x2": 252.78, "r_y2": 193.12, "r_x3": 50.11, "r_y3": 193.12, "coord_origin": "TOPLEFT" }, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.18, "r_y0": 201.8, "r_x1": 257.95, "r_y1": 201.8, "r_x2": 257.95, "r_y2": 192.4, "r_x3": 255.18, "r_y3": 192.4, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.95, "r_y0": 201.8, "r_x1": 263.77, "r_y1": 201.8, "r_x2": 263.77, "r_y2": 192.96, "r_x3": 257.95, "r_y3": 192.96, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.15, "r_y0": 201.8, "r_x1": 267.92, "r_y1": 201.8, "r_x2": 267.92, "r_y2": 192.4, "r_x3": 265.15, "r_y3": 192.4, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.32, "r_y0": 202.02, "r_x1": 286.36, "r_y1": 202.02, "r_x2": 286.36, "r_y2": 193.12, "r_x3": 270.32, "r_y3": 193.12, "coord_origin": "TOPLEFT" }, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 213.98, "r_x1": 172.13, "r_y1": 213.98, "r_x2": 172.13, "r_y2": 205.07, "r_x3": 50.11, "r_y3": 205.07, "coord_origin": "TOPLEFT" }, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.62, "r_y0": 213.76, "r_x1": 180.45, "r_y1": 213.76, "r_x2": 180.45, "r_y2": 204.91, "r_x3": 174.62, "r_y3": 204.91, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.83, "r_y0": 213.98, "r_x1": 184.32, "r_y1": 213.98, "r_x2": 184.32, "r_y2": 205.07, "r_x3": 181.83, "r_y3": 205.07, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "section_header", "bbox": { "l": 50.11, "t": 224.82, "r": 170.45, "b": 234.67, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 234.67, "r_x1": 64.55, "r_y1": 234.67, "r_x2": 64.55, "r_y2": 224.82, "r_x3": 50.11, "r_y3": 224.82, "coord_origin": "TOPLEFT" }, "text": "5.4.", "orig": "5.4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.18, "r_y0": 234.67, "r_x1": 170.45, "r_y1": 234.67, "r_x2": 170.45, "r_y2": 224.82, "r_x3": 74.18, "r_y3": 224.82, "coord_origin": "TOPLEFT" }, "text": "Quantitative Analysis", "orig": "Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 243.65, "r": 286.37, "b": 396.14, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 252.61, "r_x1": 105.32, "r_y1": 252.61, "r_x2": 105.32, "r_y2": 243.65, "r_x3": 62.07, "r_y3": 243.65, "coord_origin": "TOPLEFT" }, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.13, "r_y0": 252.68, "r_x1": 184.68, "r_y1": 252.68, "r_x2": 184.68, "r_y2": 243.77, "r_x3": 112.13, "r_y3": 243.77, "coord_origin": "TOPLEFT" }, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 191.48, "r_y0": 252.68, "r_x1": 286.36, "r_y1": 252.68, "r_x2": 286.36, "r_y2": 243.77, "r_x3": 191.48, "r_y3": 243.77, "coord_origin": "TOPLEFT" }, "text": "2, TableFormer outper-", "orig": "2, TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.63, "r_x1": 286.37, "r_y1": 264.63, "r_x2": 286.37, "r_y2": 255.72, "r_x3": 50.11, "r_y3": 255.72, "coord_origin": "TOPLEFT" }, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.59, "r_x1": 286.37, "r_y1": 276.59, "r_x2": 286.37, "r_y2": 267.68, "r_x3": 50.11, "r_y3": 267.68, "coord_origin": "TOPLEFT" }, "text": "margin for predicting the table structure from an image.", "orig": "margin for predicting the table structure from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.54, "r_x1": 286.37, "r_y1": 288.54, "r_x2": 286.37, "r_y2": 279.63, "r_x3": 50.11, "r_y3": 279.63, "coord_origin": "TOPLEFT" }, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.5, "r_x1": 286.37, "r_y1": 300.5, "r_x2": 286.37, "r_y2": 291.59, "r_x3": 50.11, "r_y3": 291.59, "coord_origin": "TOPLEFT" }, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.45, "r_x1": 286.37, "r_y1": 312.45, "r_x2": 286.37, "r_y2": 303.55, "r_x3": 50.11, "r_y3": 303.55, "coord_origin": "TOPLEFT" }, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.41, "r_x1": 286.37, "r_y1": 324.41, "r_x2": 286.37, "r_y2": 315.5, "r_x3": 50.11, "r_y3": 315.5, "coord_origin": "TOPLEFT" }, "text": "dataset. It has been observed that large tables (e.g. tables", "orig": "dataset. It has been observed that large tables (e.g. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.36, "r_x1": 286.37, "r_y1": 336.36, "r_x2": 286.37, "r_y2": 327.46, "r_x3": 50.11, "r_y3": 327.46, "coord_origin": "TOPLEFT" }, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.32, "r_x1": 286.37, "r_y1": 348.32, "r_x2": 286.37, "r_y2": 339.41, "r_x3": 50.11, "r_y3": 339.41, "coord_origin": "TOPLEFT" }, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 360.27, "r_x1": 286.37, "r_y1": 360.27, "r_x2": 286.37, "r_y2": 351.37, "r_x3": 50.11, "r_y3": 351.37, "coord_origin": "TOPLEFT" }, "text": "processing step, that produces downsampled images with", "orig": "processing step, that produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 372.23, "r_x1": 286.37, "r_y1": 372.23, "r_x2": 286.37, "r_y2": 363.32, "r_x3": 50.11, "r_y3": 363.32, "coord_origin": "TOPLEFT" }, "text": "indistinguishable features. This problem can be addressed", "orig": "indistinguishable features. This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 384.18, "r_x1": 286.37, "r_y1": 384.18, "r_x2": 286.37, "r_y2": 375.28, "r_x3": 50.11, "r_y3": 375.28, "coord_origin": "TOPLEFT" }, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.14, "r_x1": 170.01, "r_y1": 396.14, "r_x2": 170.01, "r_y2": 387.23, "r_x3": 50.11, "r_y3": 387.23, "coord_origin": "TOPLEFT" }, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 53.37, "t": 409.14, "r": 283.04, "b": 582.4, "coord_origin": "TOPLEFT" }, "confidence": 0.989, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 27, "label": "text", "bbox": { "l": 78.84, "t": 420.69, "r": 104.86, "b": 429.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 211.2, "t": 414.71, "r": 236.11, "b": 423.62, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 129.34, "t": 426.67, "r": 159.22, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 171.17, "t": 426.67, "r": 199.4, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 211.36, "t": 426.67, "r": 247.74, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 264.54, "t": 426.67, "r": 277.27, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 81.61, "t": 443.62, "r": 102.09, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 134.87, "t": 443.62, "r": 153.69, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 176.57, "t": 443.62, "r": 194.0, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 220.83, "t": 443.62, "r": 238.26, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 262.18, "t": 443.62, "r": 279.62, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 82.17, "t": 455.58, "r": 101.53, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 134.87, "t": 455.58, "r": 153.69, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 183.62, "t": 455.58, "r": 186.94, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 227.89, "t": 455.58, "r": 231.21, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 259.7, "t": 455.58, "r": 282.11, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 66.32, "t": 468.13, "r": 117.38, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 134.87, "t": 468.13, "r": 153.69, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 176.57, "t": 468.13, "r": 194.01, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 220.83, "t": 468.13, "r": 238.27, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 259.7, "t": 468.01, "r": 282.11, "b": 476.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 81.61, "t": 483.33, "r": 102.09, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 134.87, "t": 483.33, "r": 153.69, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 176.57, "t": 483.33, "r": 194.0, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 218.34, "t": 483.33, "r": 240.75, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 262.18, "t": 483.33, "r": 279.62, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 82.17, "t": 495.28, "r": 101.53, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 134.87, "t": 495.28, "r": 153.69, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 183.62, "t": 495.28, "r": 186.94, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 227.89, "t": 495.28, "r": 231.21, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 259.7, "t": 495.28, "r": 282.11, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 71.79, "t": 507.24, "r": 111.91, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 134.86, "t": 507.24, "r": 153.68, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.63, "t": 507.24, "r": 186.95, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 227.89, "t": 507.24, "r": 231.21, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 259.69, "t": 507.24, "r": 282.11, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 66.32, "t": 519.19, "r": 117.38, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 134.87, "t": 519.19, "r": 153.69, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 176.57, "t": 519.19, "r": 194.01, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 220.83, "t": 519.19, "r": 238.27, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 262.19, "t": 519.07, "r": 279.62, "b": 528.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 81.61, "t": 536.5, "r": 102.09, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 137.91, "t": 536.5, "r": 150.64, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 176.57, "t": 536.5, "r": 194.0, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 227.89, "t": 536.5, "r": 231.21, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 262.18, "t": 536.5, "r": 279.62, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 66.32, "t": 548.45, "r": 117.38, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 137.91, "t": 548.45, "r": 150.64, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 176.57, "t": 548.45, "r": 194.01, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 227.89, "t": 548.45, "r": 231.21, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 262.19, "t": 548.33, "r": 279.62, "b": 557.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 66.32, "t": 568.0, "r": 117.38, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 134.87, "t": 568.0, "r": 153.69, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 176.57, "t": 568.0, "r": 194.01, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 220.83, "t": 568.0, "r": 238.27, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 262.19, "t": 568.0, "r": 279.62, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 15, "label": "text", "bbox": { "l": 50.11, "t": 592.43, "r": 286.37, "b": 613.29, "coord_origin": "TOPLEFT" }, "confidence": 0.721, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 601.34, "r_x1": 286.37, "r_y1": 601.34, "r_x2": 286.37, "r_y2": 592.43, "r_x3": 50.11, "r_y3": 592.43, "coord_origin": "TOPLEFT" }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 613.29, "r_x1": 247.46, "r_y1": 613.29, "r_x2": 247.46, "r_y2": 604.39, "r_x3": 50.11, "r_y3": 604.39, "coord_origin": "TOPLEFT" }, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 50.11, "t": 616.34, "r": 261.79, "b": 625.25, "coord_origin": "TOPLEFT" }, "confidence": 0.643, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 625.25, "r_x1": 261.79, "r_y1": 625.25, "r_x2": 261.79, "r_y2": 616.34, "r_x3": 50.11, "r_y3": 616.34, "coord_origin": "TOPLEFT" }, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 644.35, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 653.31, "r_x1": 124.72, "r_y1": 653.31, "r_x2": 124.72, "r_y2": 644.35, "r_x3": 62.07, "r_y3": 644.35, "coord_origin": "TOPLEFT" }, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.2, "r_y0": 653.38, "r_x1": 242.93, "r_y1": 653.38, "r_x2": 242.93, "r_y2": 644.47, "r_x3": 128.2, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.55, "r_y0": 653.15, "r_x1": 286.36, "r_y1": 653.15, "r_x2": 286.36, "r_y2": 644.56, "r_x3": 245.55, "r_y3": 644.56, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.1, "r_x1": 84.97, "r_y1": 665.1, "r_x2": 84.97, "r_y2": 656.51, "r_x3": 50.11, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.52, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 89.52, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "provides bounding boxes that can be improved", "orig": "provides bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "grid-like structure of tables to refine the predictions. A de-", "orig": "grid-like structure of tables to refine the predictions. A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "supplementary material. As shown in Tab. 3, we evaluate", "orig": "supplementary material. As shown in Tab. 3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 227.58, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 322.14, "r_y1": 84.11, "r_x2": 322.14, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.45, "r_y0": 83.89, "r_x1": 404.57, "r_y1": 83.89, "r_x2": 404.57, "r_y2": 75.3, "r_x3": 325.45, "r_y3": 75.3, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.1, "r_y0": 84.11, "r_x1": 545.11, "r_y1": 84.11, "r_x2": 545.11, "r_y2": 75.21, "r_x3": 408.1, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 470.23, "r_y1": 108.02, "r_x2": 470.23, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "for pre-processing and post-processing.", "orig": "for pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.53, "r_y0": 108.02, "r_x1": 545.12, "r_y1": 108.02, "r_x2": 545.12, "r_y2": 99.12, "r_x3": 477.53, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 119.98, "r_x1": 545.12, "r_y1": 119.98, "r_x2": 545.12, "r_y2": 111.07, "r_x3": 308.86, "r_y3": 111.07, "coord_origin": "TOPLEFT" }, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 131.93, "r_x1": 545.12, "r_y1": 131.93, "r_x2": 545.12, "r_y2": 123.03, "r_x3": 308.86, "r_y3": 123.03, "coord_origin": "TOPLEFT" }, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 143.89, "r_x1": 502.02, "r_y1": 143.89, "r_x2": 502.02, "r_y2": 134.98, "r_x3": 308.86, "r_y3": 134.98, "coord_origin": "TOPLEFT" }, "text": "posed approach, we\u2019ve integrated TableFormer\u2019s", "orig": "posed approach, we\u2019ve integrated TableFormer\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 504.47, "r_y0": 143.66, "r_x1": 545.11, "r_y1": 143.66, "r_x2": 545.11, "r_y2": 135.07, "r_x3": 504.47, "r_y3": 135.07, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 155.62, "r_x1": 343.16, "r_y1": 155.62, "r_x2": 343.16, "r_y2": 147.03, "r_x3": 308.86, "r_y3": 147.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.37, "r_y0": 155.85, "r_x1": 545.11, "r_y1": 155.85, "r_x2": 545.11, "r_y2": 146.94, "r_x3": 346.37, "r_y3": 146.94, "coord_origin": "TOPLEFT" }, "text": "into EDD architecture. As mentioned previously,", "orig": "into EDD architecture. As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 167.8, "r_x1": 446.16, "r_y1": 167.8, "r_x2": 446.16, "r_y2": 158.89, "r_x3": 308.86, "r_y3": 158.89, "coord_origin": "TOPLEFT" }, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.29, "r_y0": 167.57, "r_x1": 525.04, "r_y1": 167.57, "r_x2": 525.04, "r_y2": 158.98, "r_x3": 448.29, "r_y3": 158.98, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.4, "r_y0": 167.8, "r_x1": 545.11, "r_y1": 167.8, "r_x2": 545.11, "r_y2": 158.89, "r_x3": 527.4, "r_y3": 158.89, "coord_origin": "TOPLEFT" }, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 179.76, "r_x1": 545.12, "r_y1": 179.76, "r_x2": 545.12, "r_y2": 170.85, "r_x3": 308.86, "r_y3": 170.85, "coord_origin": "TOPLEFT" }, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 191.71, "r_x1": 432.87, "r_y1": 191.71, "r_x2": 432.87, "r_y2": 182.8, "r_x3": 308.86, "r_y3": 182.8, "coord_origin": "TOPLEFT" }, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.39, "r_y0": 191.48, "r_x1": 510.93, "r_y1": 191.48, "r_x2": 510.93, "r_y2": 182.89, "r_x3": 436.39, "r_y3": 182.89, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.68, "r_y0": 191.71, "r_x1": 545.11, "r_y1": 191.71, "r_x2": 545.11, "r_y2": 182.8, "r_x3": 514.68, "r_y3": 182.8, "coord_origin": "TOPLEFT" }, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 203.67, "r_x1": 431.17, "r_y1": 203.67, "r_x2": 431.17, "r_y2": 194.76, "r_x3": 308.86, "r_y3": 194.76, "coord_origin": "TOPLEFT" }, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.68, "r_y0": 203.44, "r_x1": 514.18, "r_y1": 203.44, "r_x2": 514.18, "r_y2": 194.85, "r_x3": 434.68, "r_y3": 194.85, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.18, "r_y0": 203.67, "r_x1": 545.11, "r_y1": 203.67, "r_x2": 545.11, "r_y2": 194.76, "r_x3": 514.18, "r_y3": 194.76, "coord_origin": "TOPLEFT" }, "text": ". If the", "orig": ". If the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 215.39, "r_x1": 382.36, "r_y1": 215.39, "r_x2": 382.36, "r_y2": 206.81, "r_x3": 308.86, "r_y3": 206.81, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.08, "r_y0": 215.62, "r_x1": 545.11, "r_y1": 215.62, "r_x2": 545.11, "r_y2": 206.72, "r_x3": 385.08, "r_y3": 206.72, "coord_origin": "TOPLEFT" }, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 227.58, "r_x1": 501.7, "r_y1": 227.58, "r_x2": 501.7, "r_y2": 218.67, "r_x3": 308.86, "r_y3": 218.67, "coord_origin": "TOPLEFT" }, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 308.41, "t": 247.88, "r": 533.64, "b": 303.81, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 339.32, "t": 253.66, "r": 365.34, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 401.04, "t": 253.66, "r": 430.92, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 454.1, "t": 253.66, "r": 474.59, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 486.54, "t": 253.66, "r": 527.23, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 327.66, "t": 270.62, "r": 377.0, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 393.7, "t": 270.62, "r": 438.28, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 455.64, "t": 270.62, "r": 473.07, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 498.17, "t": 270.62, "r": 515.6, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.8, "t": 282.58, "r": 377.86, "b": 291.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 393.69, "t": 282.58, "r": 438.28, "b": 291.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 455.63, "t": 282.46, "r": 473.07, "b": 291.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 498.17, "t": 282.46, "r": 515.61, "b": 291.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 326.8, "t": 294.53, "r": 377.86, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 389.82, "t": 294.53, "r": 442.15, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 455.63, "t": 294.53, "r": 473.07, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 505.23, "t": 294.53, "r": 508.54, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 12, "label": "caption", "bbox": { "l": 308.86, "t": 316.45, "r": 545.12, "b": 337.31, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 325.36, "r_x1": 341.5, "r_y1": 325.36, "r_x2": 341.5, "r_y2": 316.45, "r_x3": 308.86, "r_y3": 316.45, "coord_origin": "TOPLEFT" }, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.6, "r_y0": 325.36, "r_x1": 545.12, "r_y1": 325.36, "r_x2": 545.12, "r_y2": 316.45, "r_x3": 348.6, "r_y3": 316.45, "coord_origin": "TOPLEFT" }, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 337.31, "r_x1": 474.98, "r_y1": 337.31, "r_x2": 474.98, "r_y2": 328.4, "r_x3": 308.86, "r_y3": 328.4, "coord_origin": "TOPLEFT" }, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 367.68, "r": 545.12, "b": 520.17, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 376.64, "r_x1": 378.95, "r_y1": 376.64, "r_x2": 378.95, "r_y2": 367.68, "r_x3": 320.82, "r_y3": 367.68, "coord_origin": "TOPLEFT" }, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.08, "r_y0": 376.71, "r_x1": 545.12, "r_y1": 376.71, "r_x2": 545.12, "r_y2": 367.8, "r_x3": 387.08, "r_y3": 367.8, "coord_origin": "TOPLEFT" }, "text": "In this section, we evaluate the entire", "orig": "In this section, we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 388.66, "r_x1": 487.19, "r_y1": 388.66, "r_x2": 487.19, "r_y2": 379.75, "r_x3": 308.86, "r_y3": 379.75, "coord_origin": "TOPLEFT" }, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.97, "r_y0": 388.66, "r_x1": 545.12, "r_y1": 388.66, "r_x2": 545.12, "r_y2": 379.75, "r_x3": 493.97, "r_y3": 379.75, "coord_origin": "TOPLEFT" }, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.62, "r_x1": 545.12, "r_y1": 400.62, "r_x2": 545.12, "r_y2": 391.71, "r_x3": 308.86, "r_y3": 391.71, "coord_origin": "TOPLEFT" }, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.57, "r_x1": 545.12, "r_y1": 412.57, "r_x2": 545.12, "r_y2": 403.67, "r_x3": 308.86, "r_y3": 403.67, "coord_origin": "TOPLEFT" }, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.53, "r_x1": 314.08, "r_y1": 424.53, "r_x2": 314.08, "r_y2": 415.62, "r_x3": 308.86, "r_y3": 415.62, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.69, "r_y0": 424.53, "r_x1": 545.12, "r_y1": 424.53, "r_x2": 545.12, "r_y2": 415.62, "r_x3": 316.69, "r_y3": 415.62, "coord_origin": "TOPLEFT" }, "text": "shows the TEDs score of HTML code representing the", "orig": "shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.48, "r_x1": 545.12, "r_y1": 436.48, "r_x2": 545.12, "r_y2": 427.58, "r_x3": 308.86, "r_y3": 427.58, "coord_origin": "TOPLEFT" }, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.44, "r_x1": 545.12, "r_y1": 448.44, "r_x2": 545.12, "r_y2": 439.53, "r_x3": 308.86, "r_y3": 439.53, "coord_origin": "TOPLEFT" }, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 460.39, "r_x1": 350.24, "r_y1": 460.39, "r_x2": 350.24, "r_y2": 451.49, "r_x3": 308.86, "r_y3": 451.49, "coord_origin": "TOPLEFT" }, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.18, "r_y0": 460.32, "r_x1": 374.59, "r_y1": 460.32, "r_x2": 374.59, "r_y2": 451.37, "r_x3": 352.18, "r_y3": 451.37, "coord_origin": "TOPLEFT" }, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.53, "r_y0": 460.39, "r_x1": 545.11, "r_y1": 460.39, "r_x2": 545.11, "r_y2": 451.49, "r_x3": 376.53, "r_y3": 451.49, "coord_origin": "TOPLEFT" }, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 472.35, "r_x1": 545.12, "r_y1": 472.35, "r_x2": 545.12, "r_y2": 463.44, "r_x3": 308.86, "r_y3": 463.44, "coord_origin": "TOPLEFT" }, "text": "mercial solutions. We believe our scores would be higher", "orig": "mercial solutions. We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 484.3, "r_x1": 545.12, "r_y1": 484.3, "r_x2": 545.12, "r_y2": 475.4, "r_x3": 308.86, "r_y3": 475.4, "coord_origin": "TOPLEFT" }, "text": "if the HTML ground-truth matched the extracted PDF cell", "orig": "if the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 496.26, "r_x1": 545.12, "r_y1": 496.26, "r_x2": 545.12, "r_y2": 487.35, "r_x3": 308.86, "r_y3": 487.35, "coord_origin": "TOPLEFT" }, "text": "content. Unfortunately, there are small discrepancies such", "orig": "content. Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 508.21, "r_x1": 545.12, "r_y1": 508.21, "r_x2": 545.12, "r_y2": 499.31, "r_x3": 308.86, "r_y3": 499.31, "coord_origin": "TOPLEFT" }, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 520.17, "r_x1": 405.7, "r_y1": 520.17, "r_x2": 405.7, "r_y2": 511.26, "r_x3": 308.86, "r_y3": 511.26, "coord_origin": "TOPLEFT" }, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "table", "bbox": { "l": 332.97, "t": 540.28, "r": 520.94, "b": 643.27, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 99, "label": "text", "bbox": { "l": 358.01, "t": 552.23, "r": 384.02, "b": 561.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 449.03, "t": 546.26, "r": 473.94, "b": 555.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 408.51, "t": 558.21, "r": 436.74, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 448.7, "t": 558.21, "r": 485.08, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 499.38, "t": 558.21, "r": 512.12, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 357.68, "t": 575.17, "r": 384.35, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 413.9, "t": 575.17, "r": 431.34, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 458.16, "t": 575.17, "r": 475.6, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 497.03, "t": 575.17, "r": 514.46, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 350.72, "t": 587.12, "r": 391.31, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 413.91, "t": 587.12, "r": 431.34, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 458.17, "t": 587.12, "r": 475.6, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 497.03, "t": 587.12, "r": 514.47, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 354.14, "t": 599.08, "r": 387.9, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 413.9, "t": 599.08, "r": 431.34, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 458.17, "t": 599.08, "r": 475.6, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 497.03, "t": 599.08, "r": 514.46, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 346.56, "t": 611.03, "r": 395.48, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 413.91, "t": 611.03, "r": 431.34, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 458.17, "t": 611.03, "r": 475.6, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 497.03, "t": 611.03, "r": 514.47, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 360.78, "t": 622.99, "r": 381.25, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 413.9, "t": 622.99, "r": 431.34, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 458.17, "t": 622.99, "r": 475.6, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 497.03, "t": 622.99, "r": 514.46, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 345.48, "t": 634.94, "r": 396.55, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 413.91, "t": 634.94, "r": 431.34, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 458.17, "t": 634.94, "r": 475.6, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 497.03, "t": 634.82, "r": 514.47, "b": 643.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 11, "label": "caption", "bbox": { "l": 308.86, "t": 656.86, "r": 545.12, "b": 689.68, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.77, "r_x1": 341.74, "r_y1": 665.77, "r_x2": 341.74, "r_y2": 656.86, "r_x3": 308.86, "r_y3": 656.86, "coord_origin": "TOPLEFT" }, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 349.56, "r_y0": 665.77, "r_x1": 545.12, "r_y1": 665.77, "r_x2": 545.12, "r_y2": 656.86, "r_x3": 349.56, "r_y3": 656.86, "coord_origin": "TOPLEFT" }, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.72, "r_x1": 545.12, "r_y1": 677.72, "r_x2": 545.12, "r_y2": 668.82, "r_x3": 308.86, "r_y3": 668.82, "coord_origin": "TOPLEFT" }, "text": "cell detection on PubTabNet. In all cases the input is PDF", "orig": "cell detection on PubTabNet. In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.68, "r_x1": 435.04, "r_y1": 689.68, "r_x2": 435.04, "r_y2": 680.77, "r_x3": 308.86, "r_y3": 680.77, "coord_origin": "TOPLEFT" }, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.879, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "0": { "label": "table", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "table", "bbox": { "l": 53.37, "t": 409.14, "r": 283.04, "b": 582.4, "coord_origin": "TOPLEFT" }, "confidence": 0.989, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 27, "label": "text", "bbox": { "l": 78.84, "t": 420.69, "r": 104.86, "b": 429.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 211.2, "t": 414.71, "r": 236.11, "b": 423.62, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 129.34, "t": 426.67, "r": 159.22, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 171.17, "t": 426.67, "r": 199.4, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 211.36, "t": 426.67, "r": 247.74, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 264.54, "t": 426.67, "r": 277.27, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 81.61, "t": 443.62, "r": 102.09, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 134.87, "t": 443.62, "r": 153.69, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 176.57, "t": 443.62, "r": 194.0, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 220.83, "t": 443.62, "r": 238.26, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 262.18, "t": 443.62, "r": 279.62, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 82.17, "t": 455.58, "r": 101.53, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 134.87, "t": 455.58, "r": 153.69, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 183.62, "t": 455.58, "r": 186.94, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 227.89, "t": 455.58, "r": 231.21, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 259.7, "t": 455.58, "r": 282.11, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 66.32, "t": 468.13, "r": 117.38, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 134.87, "t": 468.13, "r": 153.69, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 176.57, "t": 468.13, "r": 194.01, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 220.83, "t": 468.13, "r": 238.27, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 259.7, "t": 468.01, "r": 282.11, "b": 476.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 81.61, "t": 483.33, "r": 102.09, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 134.87, "t": 483.33, "r": 153.69, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 176.57, "t": 483.33, "r": 194.0, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 218.34, "t": 483.33, "r": 240.75, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 262.18, "t": 483.33, "r": 279.62, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 82.17, "t": 495.28, "r": 101.53, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 134.87, "t": 495.28, "r": 153.69, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 183.62, "t": 495.28, "r": 186.94, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 227.89, "t": 495.28, "r": 231.21, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 259.7, "t": 495.28, "r": 282.11, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 71.79, "t": 507.24, "r": 111.91, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 134.86, "t": 507.24, "r": 153.68, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.63, "t": 507.24, "r": 186.95, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 227.89, "t": 507.24, "r": 231.21, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 259.69, "t": 507.24, "r": 282.11, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 66.32, "t": 519.19, "r": 117.38, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 134.87, "t": 519.19, "r": 153.69, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 176.57, "t": 519.19, "r": 194.01, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 220.83, "t": 519.19, "r": 238.27, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 262.19, "t": 519.07, "r": 279.62, "b": 528.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 81.61, "t": 536.5, "r": 102.09, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 137.91, "t": 536.5, "r": 150.64, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 176.57, "t": 536.5, "r": 194.0, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 227.89, "t": 536.5, "r": 231.21, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 262.18, "t": 536.5, "r": 279.62, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 66.32, "t": 548.45, "r": 117.38, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 137.91, "t": 548.45, "r": 150.64, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 176.57, "t": 548.45, "r": 194.01, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 227.89, "t": 548.45, "r": 231.21, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 262.19, "t": 548.33, "r": 279.62, "b": 557.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 66.32, "t": 568.0, "r": 117.38, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 134.87, "t": 568.0, "r": 153.69, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 176.57, "t": 568.0, "r": 194.01, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 220.83, "t": 568.0, "r": 238.27, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 262.19, "t": 568.0, "r": 279.62, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 11, "num_cols": 5, "table_cells": [ { "bbox": { "l": 78.84, "t": 420.69, "r": 104.86, "b": 429.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 211.2, "t": 414.71, "r": 236.11, "b": 423.62, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 129.34, "t": 426.67, "r": 159.22, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 171.17, "t": 426.67, "r": 199.4, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 264.54, "t": 426.67, "r": 277.27, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 443.62, "r": 102.09, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 443.62, "r": 153.69, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 443.62, "r": 194.0, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 443.62, "r": 238.26, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 443.62, "r": 279.62, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.17, "t": 455.58, "r": 101.53, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 455.58, "r": 153.69, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62, "t": 455.58, "r": 186.94, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 455.58, "r": 231.21, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 455.58, "r": 282.11, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 468.13, "r": 117.38, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 468.13, "r": 153.69, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 468.13, "r": 194.01, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 468.13, "r": 238.27, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 468.01, "r": 282.11, "b": 476.97, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 483.33, "r": 102.09, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 483.33, "r": 153.69, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 483.33, "r": 194.0, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 218.34, "t": 483.33, "r": 240.75, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 483.33, "r": 279.62, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.17, "t": 495.28, "r": 101.53, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 495.28, "r": 153.69, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62, "t": 495.28, "r": 186.94, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 495.28, "r": 231.21, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 495.28, "r": 282.11, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 71.79, "t": 507.24, "r": 111.91, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86, "t": 507.24, "r": 153.68, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.63, "t": 507.24, "r": 186.95, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 507.24, "r": 231.21, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69, "t": 507.24, "r": 282.11, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 519.19, "r": 117.38, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 519.19, "r": 153.69, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 519.19, "r": 194.01, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 519.19, "r": 238.27, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 519.07, "r": 279.62, "b": 528.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 536.5, "r": 102.09, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91, "t": 536.5, "r": 150.64, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 536.5, "r": 194.0, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 536.5, "r": 231.21, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 536.5, "r": 279.62, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 548.45, "r": 117.38, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91, "t": 548.45, "r": 150.64, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 548.45, "r": 194.01, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 548.45, "r": 231.21, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 548.33, "r": 279.62, "b": 557.29, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 568.0, "r": 117.38, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 568.0, "r": 153.69, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 568.0, "r": 194.01, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 568.0, "r": 238.27, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 568.0, "r": 279.62, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false } ] }, "8": { "label": "table", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "table", "bbox": { "l": 308.41, "t": 247.88, "r": 533.64, "b": 303.81, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 339.32, "t": 253.66, "r": 365.34, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 401.04, "t": 253.66, "r": 430.92, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 454.1, "t": 253.66, "r": 474.59, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 486.54, "t": 253.66, "r": 527.23, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 327.66, "t": 270.62, "r": 377.0, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 393.7, "t": 270.62, "r": 438.28, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 455.64, "t": 270.62, "r": 473.07, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 498.17, "t": 270.62, "r": 515.6, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.8, "t": 282.58, "r": 377.86, "b": 291.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 393.69, "t": 282.58, "r": 438.28, "b": 291.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 455.63, "t": 282.46, "r": 473.07, "b": 291.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 498.17, "t": 282.46, "r": 515.61, "b": 291.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 326.8, "t": 294.53, "r": 377.86, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 389.82, "t": 294.53, "r": 442.15, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 455.63, "t": 294.53, "r": 473.07, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 505.23, "t": 294.53, "r": 508.54, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 4, "num_cols": 4, "table_cells": [ { "bbox": { "l": 339.32, "t": 253.66, "r": 365.34, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 401.04, "t": 253.66, "r": 430.92, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 454.1, "t": 253.66, "r": 474.59, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 486.54, "t": 253.66, "r": 527.23, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 327.66, "t": 270.62, "r": 377.0, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.7, "t": 270.62, "r": 438.28, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.64, "t": 270.62, "r": 473.07, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.17, "t": 270.62, "r": 515.6, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.8, "t": 282.58, "r": 377.86, "b": 291.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69, "t": 282.58, "r": 438.28, "b": 291.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63, "t": 282.46, "r": 473.07, "b": 291.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.17, "t": 282.46, "r": 515.61, "b": 291.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.8, "t": 294.53, "r": 377.86, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 389.82, "t": 294.53, "r": 442.15, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63, "t": 294.53, "r": 473.07, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 505.23, "t": 294.53, "r": 508.54, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false } ] }, "5": { "label": "table", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "table", "bbox": { "l": 332.97, "t": 540.28, "r": 520.94, "b": 643.27, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 99, "label": "text", "bbox": { "l": 358.01, "t": 552.23, "r": 384.02, "b": 561.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 449.03, "t": 546.26, "r": 473.94, "b": 555.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 408.51, "t": 558.21, "r": 436.74, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 448.7, "t": 558.21, "r": 485.08, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 499.38, "t": 558.21, "r": 512.12, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 357.68, "t": 575.17, "r": 384.35, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 413.9, "t": 575.17, "r": 431.34, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 458.16, "t": 575.17, "r": 475.6, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 497.03, "t": 575.17, "r": 514.46, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 350.72, "t": 587.12, "r": 391.31, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 413.91, "t": 587.12, "r": 431.34, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 458.17, "t": 587.12, "r": 475.6, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 497.03, "t": 587.12, "r": 514.47, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 354.14, "t": 599.08, "r": 387.9, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 413.9, "t": 599.08, "r": 431.34, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 458.17, "t": 599.08, "r": 475.6, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 497.03, "t": 599.08, "r": 514.46, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 346.56, "t": 611.03, "r": 395.48, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 413.91, "t": 611.03, "r": 431.34, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 458.17, "t": 611.03, "r": 475.6, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 497.03, "t": 611.03, "r": 514.47, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 360.78, "t": 622.99, "r": 381.25, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 413.9, "t": 622.99, "r": 431.34, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 458.17, "t": 622.99, "r": 475.6, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 497.03, "t": 622.99, "r": 514.46, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 345.48, "t": 634.94, "r": 396.55, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 413.91, "t": 634.94, "r": 431.34, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 458.17, "t": 634.94, "r": 475.6, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 497.03, "t": 634.82, "r": 514.47, "b": 643.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 4, "table_cells": [ { "bbox": { "l": 358.01, "t": 552.23, "r": 384.02, "b": 561.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.03, "t": 546.26, "r": 473.94, "b": 555.16, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 408.51, "t": 558.21, "r": 436.74, "b": 567.12, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 499.38, "t": 558.21, "r": 512.12, "b": 567.12, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 357.68, "t": 575.17, "r": 384.35, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 575.17, "r": 431.34, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16, "t": 575.17, "r": 475.6, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 575.17, "r": 514.46, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 350.72, "t": 587.12, "r": 391.31, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 587.12, "r": 431.34, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 587.12, "r": 475.6, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 587.12, "r": 514.47, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 354.14, "t": 599.08, "r": 387.9, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 599.08, "r": 431.34, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 599.08, "r": 475.6, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 599.08, "r": 514.46, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 346.56, "t": 611.03, "r": 395.48, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 611.03, "r": 431.34, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 611.03, "r": 475.6, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 611.03, "r": 514.47, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 360.78, "t": 622.99, "r": 381.25, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 622.99, "r": 431.34, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 622.99, "r": 475.6, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 622.99, "r": 514.46, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 345.48, "t": 634.94, "r": 396.55, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 634.94, "r": 431.34, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 634.94, "r": 475.6, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 634.82, "r": 514.47, "b": 643.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "section_header", "bbox": { "l": 50.11, "t": 74.4, "r": 167.9, "b": 84.25, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.25, "r_x1": 63.7, "r_y1": 84.25, "r_x2": 63.7, "r_y2": 74.4, "r_x3": 50.11, "r_y3": 74.4, "coord_origin": "TOPLEFT" }, "text": "5.3.", "orig": "5.3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.77, "r_y0": 84.25, "r_x1": 167.9, "r_y1": 84.25, "r_x2": 167.9, "r_y2": 74.4, "r_x3": 72.77, "r_y3": 74.4, "coord_origin": "TOPLEFT" }, "text": "Datasets and Metrics", "orig": "Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3. Datasets and Metrics" }, { "label": "text", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 93.35, "r": 286.37, "b": 138.12, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 102.26, "r_x1": 286.36, "r_y1": 102.26, "r_x2": 286.36, "r_y2": 93.35, "r_x3": 62.07, "r_y3": 93.35, "coord_origin": "TOPLEFT" }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 114.21, "r_x1": 286.37, "r_y1": 114.21, "r_x2": 286.37, "r_y2": 105.31, "r_x3": 50.11, "r_y3": 105.31, "coord_origin": "TOPLEFT" }, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 126.17, "r_x1": 286.37, "r_y1": 126.17, "r_x2": 286.37, "r_y2": 117.26, "r_x3": 50.11, "r_y3": 117.26, "coord_origin": "TOPLEFT" }, "text": "ground-truth as a tree structure of HTML tags. This simi-", "orig": "ground-truth as a tree structure of HTML tags. This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 138.12, "r_x1": 136.72, "r_y1": 138.12, "r_x2": 136.72, "r_y2": 129.22, "r_x3": 50.11, "r_y3": 129.22, "coord_origin": "TOPLEFT" }, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:" }, { "label": "formula", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "formula", "bbox": { "l": 86.22, "t": 150.32, "r": 286.36, "b": 172.74, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.22, "r_y0": 165.9, "r_x1": 118.88, "r_y1": 165.9, "r_x2": 118.88, "r_y2": 157.06, "r_x3": 86.22, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": "TEDS (", "orig": "TEDS (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.87, "r_y0": 165.9, "r_x1": 143.27, "r_y1": 165.9, "r_x2": 143.27, "r_y2": 157.06, "r_x3": 118.87, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.77, "r_y0": 165.9, "r_x1": 165.9, "r_y1": 165.9, "r_x2": 165.9, "r_y2": 157.06, "r_x3": 143.77, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.12, "r_y0": 165.9, "r_x1": 175.87, "r_y1": 165.9, "r_x2": 175.87, "r_y2": 156.5, "r_x3": 168.12, "r_y3": 156.5, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.28, "r_y0": 159.16, "r_x1": 221.96, "r_y1": 159.16, "r_x2": 221.96, "r_y2": 150.32, "r_x3": 179.28, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.95, "r_y0": 159.16, "r_x1": 246.35, "r_y1": 159.16, "r_x2": 246.35, "r_y2": 150.32, "r_x3": 221.95, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.84, "r_y0": 159.16, "r_x1": 250.72, "r_y1": 159.16, "r_x2": 250.72, "r_y2": 150.32, "r_x3": 246.84, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.21, "r_y0": 172.74, "r_x1": 206.29, "r_y1": 172.74, "r_x2": 206.29, "r_y2": 163.89, "r_x3": 182.21, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "max (", "orig": "max (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.29, "r_y0": 172.74, "r_x1": 209.06, "r_y1": 172.74, "r_x2": 209.06, "r_y2": 163.33, "r_x3": 206.29, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.06, "r_y0": 172.74, "r_x1": 219.2, "r_y1": 172.74, "r_x2": 219.2, "r_y2": 163.89, "r_x3": 209.06, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.7, "r_y0": 172.74, "r_x1": 222.46, "r_y1": 172.74, "r_x2": 222.46, "r_y2": 163.33, "r_x3": 219.7, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.12, "r_y0": 172.74, "r_x1": 226.89, "r_y1": 172.74, "r_x2": 226.89, "r_y2": 163.89, "r_x3": 224.12, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.55, "r_y0": 172.74, "r_x1": 231.32, "r_y1": 172.74, "r_x2": 231.32, "r_y2": 163.33, "r_x3": 228.55, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.32, "r_y0": 172.74, "r_x1": 240.65, "r_y1": 172.74, "r_x2": 240.65, "r_y2": 163.89, "r_x3": 231.32, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.14, "r_y0": 172.74, "r_x1": 243.91, "r_y1": 172.74, "r_x2": 243.91, "r_y2": 163.33, "r_x3": 241.14, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.91, "r_y0": 172.74, "r_x1": 247.79, "r_y1": 172.74, "r_x2": 247.79, "r_y2": 163.89, "r_x3": 243.91, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 166.12, "r_x1": 286.36, "r_y1": 166.12, "r_x2": 286.36, "r_y2": 157.22, "r_x3": 274.75, "r_y3": 157.22, "coord_origin": "TOPLEFT" }, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TEDS ( T$_{a}$, T$_{b}$ ) = 1 \u2212 EditDist ( T$_{a}$, T$_{b}$ ) max ( | T$_{a}$ | , | T$_{b}$ | ) (3)" }, { "label": "text", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "text", "bbox": { "l": 50.11, "t": 181.0, "r": 286.36, "b": 213.98, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 190.07, "r_x1": 86.41, "r_y1": 190.07, "r_x2": 86.41, "r_y2": 181.16, "r_x3": 62.07, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.58, "r_y0": 189.85, "r_x1": 98.72, "r_y1": 189.85, "r_x2": 98.72, "r_y2": 181.0, "r_x3": 88.58, "r_y3": 181.0, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.4, "r_y0": 190.07, "r_x1": 115.78, "r_y1": 190.07, "r_x2": 115.78, "r_y2": 181.16, "r_x3": 101.4, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.96, "r_y0": 189.85, "r_x1": 127.29, "r_y1": 189.85, "r_x2": 127.29, "r_y2": 181.0, "r_x3": 117.96, "r_y3": 181.0, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.96, "r_y0": 190.07, "r_x1": 286.36, "r_y1": 190.07, "r_x2": 286.36, "r_y2": 181.16, "r_x3": 129.96, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 202.02, "r_x1": 252.78, "r_y1": 202.02, "r_x2": 252.78, "r_y2": 193.12, "r_x3": 50.11, "r_y3": 193.12, "coord_origin": "TOPLEFT" }, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.18, "r_y0": 201.8, "r_x1": 257.95, "r_y1": 201.8, "r_x2": 257.95, "r_y2": 192.4, "r_x3": 255.18, "r_y3": 192.4, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.95, "r_y0": 201.8, "r_x1": 263.77, "r_y1": 201.8, "r_x2": 263.77, "r_y2": 192.96, "r_x3": 257.95, "r_y3": 192.96, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.15, "r_y0": 201.8, "r_x1": 267.92, "r_y1": 201.8, "r_x2": 267.92, "r_y2": 192.4, "r_x3": 265.15, "r_y3": 192.4, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.32, "r_y0": 202.02, "r_x1": 286.36, "r_y1": 202.02, "r_x2": 286.36, "r_y2": 193.12, "r_x3": 270.32, "r_y3": 193.12, "coord_origin": "TOPLEFT" }, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 213.98, "r_x1": 172.13, "r_y1": 213.98, "r_x2": 172.13, "r_y2": 205.07, "r_x3": 50.11, "r_y3": 205.07, "coord_origin": "TOPLEFT" }, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.62, "r_y0": 213.76, "r_x1": 180.45, "r_y1": 213.76, "r_x2": 180.45, "r_y2": 204.91, "r_x3": 174.62, "r_y3": 204.91, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.83, "r_y0": 213.98, "r_x1": 184.32, "r_y1": 213.98, "r_x2": 184.32, "r_y2": 205.07, "r_x3": 181.83, "r_y3": 205.07, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where T$_{a}$ and T$_{b}$ represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ." }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 50.11, "t": 224.82, "r": 170.45, "b": 234.67, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 234.67, "r_x1": 64.55, "r_y1": 234.67, "r_x2": 64.55, "r_y2": 224.82, "r_x3": 50.11, "r_y3": 224.82, "coord_origin": "TOPLEFT" }, "text": "5.4.", "orig": "5.4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.18, "r_y0": 234.67, "r_x1": 170.45, "r_y1": 234.67, "r_x2": 170.45, "r_y2": 224.82, "r_x3": 74.18, "r_y3": 224.82, "coord_origin": "TOPLEFT" }, "text": "Quantitative Analysis", "orig": "Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.4. Quantitative Analysis" }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 243.65, "r": 286.37, "b": 396.14, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 252.61, "r_x1": 105.32, "r_y1": 252.61, "r_x2": 105.32, "r_y2": 243.65, "r_x3": 62.07, "r_y3": 243.65, "coord_origin": "TOPLEFT" }, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.13, "r_y0": 252.68, "r_x1": 184.68, "r_y1": 252.68, "r_x2": 184.68, "r_y2": 243.77, "r_x3": 112.13, "r_y3": 243.77, "coord_origin": "TOPLEFT" }, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 191.48, "r_y0": 252.68, "r_x1": 286.36, "r_y1": 252.68, "r_x2": 286.36, "r_y2": 243.77, "r_x3": 191.48, "r_y3": 243.77, "coord_origin": "TOPLEFT" }, "text": "2, TableFormer outper-", "orig": "2, TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.63, "r_x1": 286.37, "r_y1": 264.63, "r_x2": 286.37, "r_y2": 255.72, "r_x3": 50.11, "r_y3": 255.72, "coord_origin": "TOPLEFT" }, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.59, "r_x1": 286.37, "r_y1": 276.59, "r_x2": 286.37, "r_y2": 267.68, "r_x3": 50.11, "r_y3": 267.68, "coord_origin": "TOPLEFT" }, "text": "margin for predicting the table structure from an image.", "orig": "margin for predicting the table structure from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.54, "r_x1": 286.37, "r_y1": 288.54, "r_x2": 286.37, "r_y2": 279.63, "r_x3": 50.11, "r_y3": 279.63, "coord_origin": "TOPLEFT" }, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.5, "r_x1": 286.37, "r_y1": 300.5, "r_x2": 286.37, "r_y2": 291.59, "r_x3": 50.11, "r_y3": 291.59, "coord_origin": "TOPLEFT" }, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.45, "r_x1": 286.37, "r_y1": 312.45, "r_x2": 286.37, "r_y2": 303.55, "r_x3": 50.11, "r_y3": 303.55, "coord_origin": "TOPLEFT" }, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.41, "r_x1": 286.37, "r_y1": 324.41, "r_x2": 286.37, "r_y2": 315.5, "r_x3": 50.11, "r_y3": 315.5, "coord_origin": "TOPLEFT" }, "text": "dataset. It has been observed that large tables (e.g. tables", "orig": "dataset. It has been observed that large tables (e.g. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.36, "r_x1": 286.37, "r_y1": 336.36, "r_x2": 286.37, "r_y2": 327.46, "r_x3": 50.11, "r_y3": 327.46, "coord_origin": "TOPLEFT" }, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.32, "r_x1": 286.37, "r_y1": 348.32, "r_x2": 286.37, "r_y2": 339.41, "r_x3": 50.11, "r_y3": 339.41, "coord_origin": "TOPLEFT" }, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 360.27, "r_x1": 286.37, "r_y1": 360.27, "r_x2": 286.37, "r_y2": 351.37, "r_x3": 50.11, "r_y3": 351.37, "coord_origin": "TOPLEFT" }, "text": "processing step, that produces downsampled images with", "orig": "processing step, that produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 372.23, "r_x1": 286.37, "r_y1": 372.23, "r_x2": 286.37, "r_y2": 363.32, "r_x3": 50.11, "r_y3": 363.32, "coord_origin": "TOPLEFT" }, "text": "indistinguishable features. This problem can be addressed", "orig": "indistinguishable features. This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 384.18, "r_x1": 286.37, "r_y1": 384.18, "r_x2": 286.37, "r_y2": 375.28, "r_x3": 50.11, "r_y3": 375.28, "coord_origin": "TOPLEFT" }, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.14, "r_x1": 170.01, "r_y1": 396.14, "r_x2": 170.01, "r_y2": 387.23, "r_x3": 50.11, "r_y3": 387.23, "coord_origin": "TOPLEFT" }, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size." }, { "label": "table", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "table", "bbox": { "l": 53.37, "t": 409.14, "r": 283.04, "b": 582.4, "coord_origin": "TOPLEFT" }, "confidence": 0.989, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 27, "label": "text", "bbox": { "l": 78.84, "t": 420.69, "r": 104.86, "b": 429.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 211.2, "t": 414.71, "r": 236.11, "b": 423.62, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 129.34, "t": 426.67, "r": 159.22, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 171.17, "t": 426.67, "r": 199.4, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 211.36, "t": 426.67, "r": 247.74, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 264.54, "t": 426.67, "r": 277.27, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 81.61, "t": 443.62, "r": 102.09, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 134.87, "t": 443.62, "r": 153.69, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 176.57, "t": 443.62, "r": 194.0, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 220.83, "t": 443.62, "r": 238.26, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 262.18, "t": 443.62, "r": 279.62, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 82.17, "t": 455.58, "r": 101.53, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 134.87, "t": 455.58, "r": 153.69, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 183.62, "t": 455.58, "r": 186.94, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 227.89, "t": 455.58, "r": 231.21, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 259.7, "t": 455.58, "r": 282.11, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 66.32, "t": 468.13, "r": 117.38, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 134.87, "t": 468.13, "r": 153.69, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 176.57, "t": 468.13, "r": 194.01, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 220.83, "t": 468.13, "r": 238.27, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 259.7, "t": 468.01, "r": 282.11, "b": 476.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 81.61, "t": 483.33, "r": 102.09, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 134.87, "t": 483.33, "r": 153.69, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 176.57, "t": 483.33, "r": 194.0, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 218.34, "t": 483.33, "r": 240.75, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 262.18, "t": 483.33, "r": 279.62, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 82.17, "t": 495.28, "r": 101.53, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 134.87, "t": 495.28, "r": 153.69, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 183.62, "t": 495.28, "r": 186.94, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 227.89, "t": 495.28, "r": 231.21, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 259.7, "t": 495.28, "r": 282.11, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 71.79, "t": 507.24, "r": 111.91, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 134.86, "t": 507.24, "r": 153.68, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.63, "t": 507.24, "r": 186.95, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 227.89, "t": 507.24, "r": 231.21, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 259.69, "t": 507.24, "r": 282.11, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 66.32, "t": 519.19, "r": 117.38, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 134.87, "t": 519.19, "r": 153.69, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 176.57, "t": 519.19, "r": 194.01, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 220.83, "t": 519.19, "r": 238.27, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 262.19, "t": 519.07, "r": 279.62, "b": 528.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 81.61, "t": 536.5, "r": 102.09, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 137.91, "t": 536.5, "r": 150.64, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 176.57, "t": 536.5, "r": 194.0, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 227.89, "t": 536.5, "r": 231.21, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 262.18, "t": 536.5, "r": 279.62, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 66.32, "t": 548.45, "r": 117.38, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 137.91, "t": 548.45, "r": 150.64, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 176.57, "t": 548.45, "r": 194.01, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 227.89, "t": 548.45, "r": 231.21, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 262.19, "t": 548.33, "r": 279.62, "b": 557.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 66.32, "t": 568.0, "r": 117.38, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 134.87, "t": 568.0, "r": 153.69, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 176.57, "t": 568.0, "r": 194.01, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 220.83, "t": 568.0, "r": 238.27, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 262.19, "t": 568.0, "r": 279.62, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 11, "num_cols": 5, "table_cells": [ { "bbox": { "l": 78.84, "t": 420.69, "r": 104.86, "b": 429.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 211.2, "t": 414.71, "r": 236.11, "b": 423.62, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 129.34, "t": 426.67, "r": 159.22, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 171.17, "t": 426.67, "r": 199.4, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 264.54, "t": 426.67, "r": 277.27, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 443.62, "r": 102.09, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 443.62, "r": 153.69, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 443.62, "r": 194.0, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 443.62, "r": 238.26, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 443.62, "r": 279.62, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.17, "t": 455.58, "r": 101.53, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 455.58, "r": 153.69, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62, "t": 455.58, "r": 186.94, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 455.58, "r": 231.21, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 455.58, "r": 282.11, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 468.13, "r": 117.38, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 468.13, "r": 153.69, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 468.13, "r": 194.01, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 468.13, "r": 238.27, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 468.01, "r": 282.11, "b": 476.97, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 483.33, "r": 102.09, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 483.33, "r": 153.69, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 483.33, "r": 194.0, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 218.34, "t": 483.33, "r": 240.75, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 483.33, "r": 279.62, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.17, "t": 495.28, "r": 101.53, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 495.28, "r": 153.69, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62, "t": 495.28, "r": 186.94, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 495.28, "r": 231.21, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 495.28, "r": 282.11, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 71.79, "t": 507.24, "r": 111.91, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86, "t": 507.24, "r": 153.68, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.63, "t": 507.24, "r": 186.95, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 507.24, "r": 231.21, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69, "t": 507.24, "r": 282.11, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 519.19, "r": 117.38, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 519.19, "r": 153.69, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 519.19, "r": 194.01, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 519.19, "r": 238.27, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 519.07, "r": 279.62, "b": 528.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 536.5, "r": 102.09, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91, "t": 536.5, "r": 150.64, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 536.5, "r": 194.0, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 536.5, "r": 231.21, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 536.5, "r": 279.62, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 548.45, "r": 117.38, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91, "t": 548.45, "r": 150.64, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 548.45, "r": 194.01, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 548.45, "r": 231.21, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 548.33, "r": 279.62, "b": 557.29, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 568.0, "r": 117.38, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 568.0, "r": 153.69, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 568.0, "r": 194.01, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 568.0, "r": 238.27, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 568.0, "r": 279.62, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "text", "id": 15, "page_no": 6, "cluster": { "id": 15, "label": "text", "bbox": { "l": 50.11, "t": 592.43, "r": 286.37, "b": 613.29, "coord_origin": "TOPLEFT" }, "confidence": 0.721, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 601.34, "r_x1": 286.37, "r_y1": 601.34, "r_x2": 286.37, "r_y2": 592.43, "r_x3": 50.11, "r_y3": 592.43, "coord_origin": "TOPLEFT" }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 613.29, "r_x1": 247.46, "r_y1": 613.29, "r_x2": 247.46, "r_y2": 604.39, "r_x3": 50.11, "r_y3": 604.39, "coord_origin": "TOPLEFT" }, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)." }, { "label": "text", "id": 16, "page_no": 6, "cluster": { "id": 16, "label": "text", "bbox": { "l": 50.11, "t": 616.34, "r": 261.79, "b": 625.25, "coord_origin": "TOPLEFT" }, "confidence": 0.643, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 625.25, "r_x1": 261.79, "r_y1": 625.25, "r_x2": 261.79, "r_y2": 616.34, "r_x3": 50.11, "r_y3": 616.34, "coord_origin": "TOPLEFT" }, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "FT: Model was trained on PubTabNet then finetuned." }, { "label": "text", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 644.35, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 653.31, "r_x1": 124.72, "r_y1": 653.31, "r_x2": 124.72, "r_y2": 644.35, "r_x3": 62.07, "r_y3": 644.35, "coord_origin": "TOPLEFT" }, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.2, "r_y0": 653.38, "r_x1": 242.93, "r_y1": 653.38, "r_x2": 242.93, "r_y2": 644.47, "r_x3": 128.2, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.55, "r_y0": 653.15, "r_x1": 286.36, "r_y1": 653.15, "r_x2": 286.36, "r_y2": 644.56, "r_x3": 245.55, "r_y3": 644.56, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.1, "r_x1": 84.97, "r_y1": 665.1, "r_x2": 84.97, "r_y2": 656.51, "r_x3": 50.11, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.52, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 89.52, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "provides bounding boxes that can be improved", "orig": "provides bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "grid-like structure of tables to refine the predictions. A de-", "orig": "grid-like structure of tables to refine the predictions. A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "supplementary material. As shown in Tab. 3, we evaluate", "orig": "supplementary material. As shown in Tab. 3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate" }, { "label": "text", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 227.58, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 322.14, "r_y1": 84.11, "r_x2": 322.14, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.45, "r_y0": 83.89, "r_x1": 404.57, "r_y1": 83.89, "r_x2": 404.57, "r_y2": 75.3, "r_x3": 325.45, "r_y3": 75.3, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.1, "r_y0": 84.11, "r_x1": 545.11, "r_y1": 84.11, "r_x2": 545.11, "r_y2": 75.21, "r_x3": 408.1, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 470.23, "r_y1": 108.02, "r_x2": 470.23, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "for pre-processing and post-processing.", "orig": "for pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.53, "r_y0": 108.02, "r_x1": 545.12, "r_y1": 108.02, "r_x2": 545.12, "r_y2": 99.12, "r_x3": 477.53, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 119.98, "r_x1": 545.12, "r_y1": 119.98, "r_x2": 545.12, "r_y2": 111.07, "r_x3": 308.86, "r_y3": 111.07, "coord_origin": "TOPLEFT" }, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 131.93, "r_x1": 545.12, "r_y1": 131.93, "r_x2": 545.12, "r_y2": 123.03, "r_x3": 308.86, "r_y3": 123.03, "coord_origin": "TOPLEFT" }, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 143.89, "r_x1": 502.02, "r_y1": 143.89, "r_x2": 502.02, "r_y2": 134.98, "r_x3": 308.86, "r_y3": 134.98, "coord_origin": "TOPLEFT" }, "text": "posed approach, we\u2019ve integrated TableFormer\u2019s", "orig": "posed approach, we\u2019ve integrated TableFormer\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 504.47, "r_y0": 143.66, "r_x1": 545.11, "r_y1": 143.66, "r_x2": 545.11, "r_y2": 135.07, "r_x3": 504.47, "r_y3": 135.07, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 155.62, "r_x1": 343.16, "r_y1": 155.62, "r_x2": 343.16, "r_y2": 147.03, "r_x3": 308.86, "r_y3": 147.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.37, "r_y0": 155.85, "r_x1": 545.11, "r_y1": 155.85, "r_x2": 545.11, "r_y2": 146.94, "r_x3": 346.37, "r_y3": 146.94, "coord_origin": "TOPLEFT" }, "text": "into EDD architecture. As mentioned previously,", "orig": "into EDD architecture. As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 167.8, "r_x1": 446.16, "r_y1": 167.8, "r_x2": 446.16, "r_y2": 158.89, "r_x3": 308.86, "r_y3": 158.89, "coord_origin": "TOPLEFT" }, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.29, "r_y0": 167.57, "r_x1": 525.04, "r_y1": 167.57, "r_x2": 525.04, "r_y2": 158.98, "r_x3": 448.29, "r_y3": 158.98, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.4, "r_y0": 167.8, "r_x1": 545.11, "r_y1": 167.8, "r_x2": 545.11, "r_y2": 158.89, "r_x3": 527.4, "r_y3": 158.89, "coord_origin": "TOPLEFT" }, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 179.76, "r_x1": 545.12, "r_y1": 179.76, "r_x2": 545.12, "r_y2": 170.85, "r_x3": 308.86, "r_y3": 170.85, "coord_origin": "TOPLEFT" }, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 191.71, "r_x1": 432.87, "r_y1": 191.71, "r_x2": 432.87, "r_y2": 182.8, "r_x3": 308.86, "r_y3": 182.8, "coord_origin": "TOPLEFT" }, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.39, "r_y0": 191.48, "r_x1": 510.93, "r_y1": 191.48, "r_x2": 510.93, "r_y2": 182.89, "r_x3": 436.39, "r_y3": 182.89, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.68, "r_y0": 191.71, "r_x1": 545.11, "r_y1": 191.71, "r_x2": 545.11, "r_y2": 182.8, "r_x3": 514.68, "r_y3": 182.8, "coord_origin": "TOPLEFT" }, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 203.67, "r_x1": 431.17, "r_y1": 203.67, "r_x2": 431.17, "r_y2": 194.76, "r_x3": 308.86, "r_y3": 194.76, "coord_origin": "TOPLEFT" }, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.68, "r_y0": 203.44, "r_x1": 514.18, "r_y1": 203.44, "r_x2": 514.18, "r_y2": 194.85, "r_x3": 434.68, "r_y3": 194.85, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.18, "r_y0": 203.67, "r_x1": 545.11, "r_y1": 203.67, "r_x2": 545.11, "r_y2": 194.76, "r_x3": 514.18, "r_y3": 194.76, "coord_origin": "TOPLEFT" }, "text": ". If the", "orig": ". If the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 215.39, "r_x1": 382.36, "r_y1": 215.39, "r_x2": 382.36, "r_y2": 206.81, "r_x3": 308.86, "r_y3": 206.81, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.08, "r_y0": 215.62, "r_x1": 545.11, "r_y1": 215.62, "r_x2": 545.11, "r_y2": 206.72, "r_x3": 385.08, "r_y3": 206.72, "coord_origin": "TOPLEFT" }, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 227.58, "r_x1": 501.7, "r_y1": 227.58, "r_x2": 501.7, "r_y2": 218.67, "r_x3": 308.86, "r_y3": 218.67, "coord_origin": "TOPLEFT" }, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes." }, { "label": "table", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "table", "bbox": { "l": 308.41, "t": 247.88, "r": 533.64, "b": 303.81, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 339.32, "t": 253.66, "r": 365.34, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 401.04, "t": 253.66, "r": 430.92, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 454.1, "t": 253.66, "r": 474.59, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 486.54, "t": 253.66, "r": 527.23, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 327.66, "t": 270.62, "r": 377.0, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 393.7, "t": 270.62, "r": 438.28, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 455.64, "t": 270.62, "r": 473.07, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 498.17, "t": 270.62, "r": 515.6, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.8, "t": 282.58, "r": 377.86, "b": 291.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 393.69, "t": 282.58, "r": 438.28, "b": 291.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 455.63, "t": 282.46, "r": 473.07, "b": 291.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 498.17, "t": 282.46, "r": 515.61, "b": 291.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 326.8, "t": 294.53, "r": 377.86, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 389.82, "t": 294.53, "r": 442.15, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 455.63, "t": 294.53, "r": 473.07, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 505.23, "t": 294.53, "r": 508.54, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 4, "num_cols": 4, "table_cells": [ { "bbox": { "l": 339.32, "t": 253.66, "r": 365.34, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 401.04, "t": 253.66, "r": 430.92, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 454.1, "t": 253.66, "r": 474.59, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 486.54, "t": 253.66, "r": 527.23, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 327.66, "t": 270.62, "r": 377.0, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.7, "t": 270.62, "r": 438.28, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.64, "t": 270.62, "r": 473.07, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.17, "t": 270.62, "r": 515.6, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.8, "t": 282.58, "r": 377.86, "b": 291.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69, "t": 282.58, "r": 438.28, "b": 291.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63, "t": 282.46, "r": 473.07, "b": 291.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.17, "t": 282.46, "r": 515.61, "b": 291.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.8, "t": 294.53, "r": 377.86, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 389.82, "t": 294.53, "r": 442.15, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63, "t": 294.53, "r": 473.07, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 505.23, "t": 294.53, "r": 508.54, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "caption", "bbox": { "l": 308.86, "t": 316.45, "r": 545.12, "b": 337.31, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 325.36, "r_x1": 341.5, "r_y1": 325.36, "r_x2": 341.5, "r_y2": 316.45, "r_x3": 308.86, "r_y3": 316.45, "coord_origin": "TOPLEFT" }, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.6, "r_y0": 325.36, "r_x1": 545.12, "r_y1": 325.36, "r_x2": 545.12, "r_y2": 316.45, "r_x3": 348.6, "r_y3": 316.45, "coord_origin": "TOPLEFT" }, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 337.31, "r_x1": 474.98, "r_y1": 337.31, "r_x2": 474.98, "r_y2": 328.4, "r_x3": 308.86, "r_y3": 328.4, "coord_origin": "TOPLEFT" }, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing." }, { "label": "text", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 367.68, "r": 545.12, "b": 520.17, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 376.64, "r_x1": 378.95, "r_y1": 376.64, "r_x2": 378.95, "r_y2": 367.68, "r_x3": 320.82, "r_y3": 367.68, "coord_origin": "TOPLEFT" }, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.08, "r_y0": 376.71, "r_x1": 545.12, "r_y1": 376.71, "r_x2": 545.12, "r_y2": 367.8, "r_x3": 387.08, "r_y3": 367.8, "coord_origin": "TOPLEFT" }, "text": "In this section, we evaluate the entire", "orig": "In this section, we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 388.66, "r_x1": 487.19, "r_y1": 388.66, "r_x2": 487.19, "r_y2": 379.75, "r_x3": 308.86, "r_y3": 379.75, "coord_origin": "TOPLEFT" }, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.97, "r_y0": 388.66, "r_x1": 545.12, "r_y1": 388.66, "r_x2": 545.12, "r_y2": 379.75, "r_x3": 493.97, "r_y3": 379.75, "coord_origin": "TOPLEFT" }, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.62, "r_x1": 545.12, "r_y1": 400.62, "r_x2": 545.12, "r_y2": 391.71, "r_x3": 308.86, "r_y3": 391.71, "coord_origin": "TOPLEFT" }, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.57, "r_x1": 545.12, "r_y1": 412.57, "r_x2": 545.12, "r_y2": 403.67, "r_x3": 308.86, "r_y3": 403.67, "coord_origin": "TOPLEFT" }, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.53, "r_x1": 314.08, "r_y1": 424.53, "r_x2": 314.08, "r_y2": 415.62, "r_x3": 308.86, "r_y3": 415.62, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.69, "r_y0": 424.53, "r_x1": 545.12, "r_y1": 424.53, "r_x2": 545.12, "r_y2": 415.62, "r_x3": 316.69, "r_y3": 415.62, "coord_origin": "TOPLEFT" }, "text": "shows the TEDs score of HTML code representing the", "orig": "shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.48, "r_x1": 545.12, "r_y1": 436.48, "r_x2": 545.12, "r_y2": 427.58, "r_x3": 308.86, "r_y3": 427.58, "coord_origin": "TOPLEFT" }, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.44, "r_x1": 545.12, "r_y1": 448.44, "r_x2": 545.12, "r_y2": 439.53, "r_x3": 308.86, "r_y3": 439.53, "coord_origin": "TOPLEFT" }, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 460.39, "r_x1": 350.24, "r_y1": 460.39, "r_x2": 350.24, "r_y2": 451.49, "r_x3": 308.86, "r_y3": 451.49, "coord_origin": "TOPLEFT" }, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.18, "r_y0": 460.32, "r_x1": 374.59, "r_y1": 460.32, "r_x2": 374.59, "r_y2": 451.37, "r_x3": 352.18, "r_y3": 451.37, "coord_origin": "TOPLEFT" }, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.53, "r_y0": 460.39, "r_x1": 545.11, "r_y1": 460.39, "r_x2": 545.11, "r_y2": 451.49, "r_x3": 376.53, "r_y3": 451.49, "coord_origin": "TOPLEFT" }, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 472.35, "r_x1": 545.12, "r_y1": 472.35, "r_x2": 545.12, "r_y2": 463.44, "r_x3": 308.86, "r_y3": 463.44, "coord_origin": "TOPLEFT" }, "text": "mercial solutions. We believe our scores would be higher", "orig": "mercial solutions. We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 484.3, "r_x1": 545.12, "r_y1": 484.3, "r_x2": 545.12, "r_y2": 475.4, "r_x3": 308.86, "r_y3": 475.4, "coord_origin": "TOPLEFT" }, "text": "if the HTML ground-truth matched the extracted PDF cell", "orig": "if the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 496.26, "r_x1": 545.12, "r_y1": 496.26, "r_x2": 545.12, "r_y2": 487.35, "r_x3": 308.86, "r_y3": 487.35, "coord_origin": "TOPLEFT" }, "text": "content. Unfortunately, there are small discrepancies such", "orig": "content. Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 508.21, "r_x1": 545.12, "r_y1": 508.21, "r_x2": 545.12, "r_y2": 499.31, "r_x3": 308.86, "r_y3": 499.31, "coord_origin": "TOPLEFT" }, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 520.17, "r_x1": 405.7, "r_y1": 520.17, "r_x2": 405.7, "r_y2": 511.26, "r_x3": 308.86, "r_y3": 511.26, "coord_origin": "TOPLEFT" }, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations." }, { "label": "table", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "table", "bbox": { "l": 332.97, "t": 540.28, "r": 520.94, "b": 643.27, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 99, "label": "text", "bbox": { "l": 358.01, "t": 552.23, "r": 384.02, "b": 561.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 449.03, "t": 546.26, "r": 473.94, "b": 555.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 408.51, "t": 558.21, "r": 436.74, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 448.7, "t": 558.21, "r": 485.08, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 499.38, "t": 558.21, "r": 512.12, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 357.68, "t": 575.17, "r": 384.35, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 413.9, "t": 575.17, "r": 431.34, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 458.16, "t": 575.17, "r": 475.6, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 497.03, "t": 575.17, "r": 514.46, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 350.72, "t": 587.12, "r": 391.31, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 413.91, "t": 587.12, "r": 431.34, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 458.17, "t": 587.12, "r": 475.6, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 497.03, "t": 587.12, "r": 514.47, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 354.14, "t": 599.08, "r": 387.9, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 413.9, "t": 599.08, "r": 431.34, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 458.17, "t": 599.08, "r": 475.6, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 497.03, "t": 599.08, "r": 514.46, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 346.56, "t": 611.03, "r": 395.48, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 413.91, "t": 611.03, "r": 431.34, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 458.17, "t": 611.03, "r": 475.6, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 497.03, "t": 611.03, "r": 514.47, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 360.78, "t": 622.99, "r": 381.25, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 413.9, "t": 622.99, "r": 431.34, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 458.17, "t": 622.99, "r": 475.6, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 497.03, "t": 622.99, "r": 514.46, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 345.48, "t": 634.94, "r": 396.55, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 413.91, "t": 634.94, "r": 431.34, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 458.17, "t": 634.94, "r": 475.6, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 497.03, "t": 634.82, "r": 514.47, "b": 643.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 4, "table_cells": [ { "bbox": { "l": 358.01, "t": 552.23, "r": 384.02, "b": 561.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.03, "t": 546.26, "r": 473.94, "b": 555.16, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 408.51, "t": 558.21, "r": 436.74, "b": 567.12, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 499.38, "t": 558.21, "r": 512.12, "b": 567.12, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 357.68, "t": 575.17, "r": 384.35, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 575.17, "r": 431.34, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16, "t": 575.17, "r": 475.6, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 575.17, "r": 514.46, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 350.72, "t": 587.12, "r": 391.31, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 587.12, "r": 431.34, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 587.12, "r": 475.6, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 587.12, "r": 514.47, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 354.14, "t": 599.08, "r": 387.9, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 599.08, "r": 431.34, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 599.08, "r": 475.6, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 599.08, "r": 514.46, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 346.56, "t": 611.03, "r": 395.48, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 611.03, "r": 431.34, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 611.03, "r": 475.6, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 611.03, "r": 514.47, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 360.78, "t": 622.99, "r": 381.25, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 622.99, "r": 431.34, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 622.99, "r": 475.6, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 622.99, "r": 514.46, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 345.48, "t": 634.94, "r": 396.55, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 634.94, "r": 431.34, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 634.94, "r": 475.6, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 634.82, "r": 514.47, "b": 643.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "caption", "bbox": { "l": 308.86, "t": 656.86, "r": 545.12, "b": 689.68, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.77, "r_x1": 341.74, "r_y1": 665.77, "r_x2": 341.74, "r_y2": 656.86, "r_x3": 308.86, "r_y3": 656.86, "coord_origin": "TOPLEFT" }, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 349.56, "r_y0": 665.77, "r_x1": 545.12, "r_y1": 665.77, "r_x2": 545.12, "r_y2": 656.86, "r_x3": 349.56, "r_y3": 656.86, "coord_origin": "TOPLEFT" }, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.72, "r_x1": 545.12, "r_y1": 677.72, "r_x2": 545.12, "r_y2": 668.82, "r_x3": 308.86, "r_y3": 668.82, "coord_origin": "TOPLEFT" }, "text": "cell detection on PubTabNet. In all cases the input is PDF", "orig": "cell detection on PubTabNet. In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.68, "r_x1": 435.04, "r_y1": 689.68, "r_x2": 435.04, "r_y2": 680.77, "r_x3": 308.86, "r_y3": 680.77, "coord_origin": "TOPLEFT" }, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables." }, { "label": "page_footer", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.879, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" } ], "body": [ { "label": "section_header", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "section_header", "bbox": { "l": 50.11, "t": 74.4, "r": 167.9, "b": 84.25, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.25, "r_x1": 63.7, "r_y1": 84.25, "r_x2": 63.7, "r_y2": 74.4, "r_x3": 50.11, "r_y3": 74.4, "coord_origin": "TOPLEFT" }, "text": "5.3.", "orig": "5.3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.77, "r_y0": 84.25, "r_x1": 167.9, "r_y1": 84.25, "r_x2": 167.9, "r_y2": 74.4, "r_x3": 72.77, "r_y3": 74.4, "coord_origin": "TOPLEFT" }, "text": "Datasets and Metrics", "orig": "Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3. Datasets and Metrics" }, { "label": "text", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 93.35, "r": 286.37, "b": 138.12, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 102.26, "r_x1": 286.36, "r_y1": 102.26, "r_x2": 286.36, "r_y2": 93.35, "r_x3": 62.07, "r_y3": 93.35, "coord_origin": "TOPLEFT" }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 114.21, "r_x1": 286.37, "r_y1": 114.21, "r_x2": 286.37, "r_y2": 105.31, "r_x3": 50.11, "r_y3": 105.31, "coord_origin": "TOPLEFT" }, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 126.17, "r_x1": 286.37, "r_y1": 126.17, "r_x2": 286.37, "r_y2": 117.26, "r_x3": 50.11, "r_y3": 117.26, "coord_origin": "TOPLEFT" }, "text": "ground-truth as a tree structure of HTML tags. This simi-", "orig": "ground-truth as a tree structure of HTML tags. This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 138.12, "r_x1": 136.72, "r_y1": 138.12, "r_x2": 136.72, "r_y2": 129.22, "r_x3": 50.11, "r_y3": 129.22, "coord_origin": "TOPLEFT" }, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:" }, { "label": "formula", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "formula", "bbox": { "l": 86.22, "t": 150.32, "r": 286.36, "b": 172.74, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.22, "r_y0": 165.9, "r_x1": 118.88, "r_y1": 165.9, "r_x2": 118.88, "r_y2": 157.06, "r_x3": 86.22, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": "TEDS (", "orig": "TEDS (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 118.87, "r_y0": 165.9, "r_x1": 143.27, "r_y1": 165.9, "r_x2": 143.27, "r_y2": 157.06, "r_x3": 118.87, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.77, "r_y0": 165.9, "r_x1": 165.9, "r_y1": 165.9, "r_x2": 165.9, "r_y2": 157.06, "r_x3": 143.77, "r_y3": 157.06, "coord_origin": "TOPLEFT" }, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.12, "r_y0": 165.9, "r_x1": 175.87, "r_y1": 165.9, "r_x2": 175.87, "r_y2": 156.5, "r_x3": 168.12, "r_y3": 156.5, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.28, "r_y0": 159.16, "r_x1": 221.96, "r_y1": 159.16, "r_x2": 221.96, "r_y2": 150.32, "r_x3": 179.28, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.95, "r_y0": 159.16, "r_x1": 246.35, "r_y1": 159.16, "r_x2": 246.35, "r_y2": 150.32, "r_x3": 221.95, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$, T$_{b}$", "orig": "T$_{a}$, T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.84, "r_y0": 159.16, "r_x1": 250.72, "r_y1": 159.16, "r_x2": 250.72, "r_y2": 150.32, "r_x3": 246.84, "r_y3": 150.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.21, "r_y0": 172.74, "r_x1": 206.29, "r_y1": 172.74, "r_x2": 206.29, "r_y2": 163.89, "r_x3": 182.21, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "max (", "orig": "max (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.29, "r_y0": 172.74, "r_x1": 209.06, "r_y1": 172.74, "r_x2": 209.06, "r_y2": 163.33, "r_x3": 206.29, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.06, "r_y0": 172.74, "r_x1": 219.2, "r_y1": 172.74, "r_x2": 219.2, "r_y2": 163.89, "r_x3": 209.06, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.7, "r_y0": 172.74, "r_x1": 222.46, "r_y1": 172.74, "r_x2": 222.46, "r_y2": 163.33, "r_x3": 219.7, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.12, "r_y0": 172.74, "r_x1": 226.89, "r_y1": 172.74, "r_x2": 226.89, "r_y2": 163.89, "r_x3": 224.12, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 228.55, "r_y0": 172.74, "r_x1": 231.32, "r_y1": 172.74, "r_x2": 231.32, "r_y2": 163.33, "r_x3": 228.55, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.32, "r_y0": 172.74, "r_x1": 240.65, "r_y1": 172.74, "r_x2": 240.65, "r_y2": 163.89, "r_x3": 231.32, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.14, "r_y0": 172.74, "r_x1": 243.91, "r_y1": 172.74, "r_x2": 243.91, "r_y2": 163.33, "r_x3": 241.14, "r_y3": 163.33, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.91, "r_y0": 172.74, "r_x1": 247.79, "r_y1": 172.74, "r_x2": 247.79, "r_y2": 163.89, "r_x3": 243.91, "r_y3": 163.89, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 166.12, "r_x1": 286.36, "r_y1": 166.12, "r_x2": 286.36, "r_y2": 157.22, "r_x3": 274.75, "r_y3": 157.22, "coord_origin": "TOPLEFT" }, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TEDS ( T$_{a}$, T$_{b}$ ) = 1 \u2212 EditDist ( T$_{a}$, T$_{b}$ ) max ( | T$_{a}$ | , | T$_{b}$ | ) (3)" }, { "label": "text", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "text", "bbox": { "l": 50.11, "t": 181.0, "r": 286.36, "b": 213.98, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 190.07, "r_x1": 86.41, "r_y1": 190.07, "r_x2": 86.41, "r_y2": 181.16, "r_x3": 62.07, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.58, "r_y0": 189.85, "r_x1": 98.72, "r_y1": 189.85, "r_x2": 98.72, "r_y2": 181.0, "r_x3": 88.58, "r_y3": 181.0, "coord_origin": "TOPLEFT" }, "text": "T$_{a}$", "orig": "T$_{a}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.4, "r_y0": 190.07, "r_x1": 115.78, "r_y1": 190.07, "r_x2": 115.78, "r_y2": 181.16, "r_x3": 101.4, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.96, "r_y0": 189.85, "r_x1": 127.29, "r_y1": 189.85, "r_x2": 127.29, "r_y2": 181.0, "r_x3": 117.96, "r_y3": 181.0, "coord_origin": "TOPLEFT" }, "text": "T$_{b}$", "orig": "T$_{b}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.96, "r_y0": 190.07, "r_x1": 286.36, "r_y1": 190.07, "r_x2": 286.36, "r_y2": 181.16, "r_x3": 129.96, "r_y3": 181.16, "coord_origin": "TOPLEFT" }, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 202.02, "r_x1": 252.78, "r_y1": 202.02, "r_x2": 252.78, "r_y2": 193.12, "r_x3": 50.11, "r_y3": 193.12, "coord_origin": "TOPLEFT" }, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.18, "r_y0": 201.8, "r_x1": 257.95, "r_y1": 201.8, "r_x2": 257.95, "r_y2": 192.4, "r_x3": 255.18, "r_y3": 192.4, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.95, "r_y0": 201.8, "r_x1": 263.77, "r_y1": 201.8, "r_x2": 263.77, "r_y2": 192.96, "r_x3": 257.95, "r_y3": 192.96, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.15, "r_y0": 201.8, "r_x1": 267.92, "r_y1": 201.8, "r_x2": 267.92, "r_y2": 192.4, "r_x3": 265.15, "r_y3": 192.4, "coord_origin": "TOPLEFT" }, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.32, "r_y0": 202.02, "r_x1": 286.36, "r_y1": 202.02, "r_x2": 286.36, "r_y2": 193.12, "r_x3": 270.32, "r_y3": 193.12, "coord_origin": "TOPLEFT" }, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 213.98, "r_x1": 172.13, "r_y1": 213.98, "r_x2": 172.13, "r_y2": 205.07, "r_x3": 50.11, "r_y3": 205.07, "coord_origin": "TOPLEFT" }, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 174.62, "r_y0": 213.76, "r_x1": 180.45, "r_y1": 213.76, "r_x2": 180.45, "r_y2": 204.91, "r_x3": 174.62, "r_y3": 204.91, "coord_origin": "TOPLEFT" }, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.83, "r_y0": 213.98, "r_x1": 184.32, "r_y1": 213.98, "r_x2": 184.32, "r_y2": 205.07, "r_x3": 181.83, "r_y3": 205.07, "coord_origin": "TOPLEFT" }, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where T$_{a}$ and T$_{b}$ represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ." }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 50.11, "t": 224.82, "r": 170.45, "b": 234.67, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 234.67, "r_x1": 64.55, "r_y1": 234.67, "r_x2": 64.55, "r_y2": 224.82, "r_x3": 50.11, "r_y3": 224.82, "coord_origin": "TOPLEFT" }, "text": "5.4.", "orig": "5.4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.18, "r_y0": 234.67, "r_x1": 170.45, "r_y1": 234.67, "r_x2": 170.45, "r_y2": 224.82, "r_x3": 74.18, "r_y3": 224.82, "coord_origin": "TOPLEFT" }, "text": "Quantitative Analysis", "orig": "Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.4. Quantitative Analysis" }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 243.65, "r": 286.37, "b": 396.14, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 252.61, "r_x1": 105.32, "r_y1": 252.61, "r_x2": 105.32, "r_y2": 243.65, "r_x3": 62.07, "r_y3": 243.65, "coord_origin": "TOPLEFT" }, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.13, "r_y0": 252.68, "r_x1": 184.68, "r_y1": 252.68, "r_x2": 184.68, "r_y2": 243.77, "r_x3": 112.13, "r_y3": 243.77, "coord_origin": "TOPLEFT" }, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 191.48, "r_y0": 252.68, "r_x1": 286.36, "r_y1": 252.68, "r_x2": 286.36, "r_y2": 243.77, "r_x3": 191.48, "r_y3": 243.77, "coord_origin": "TOPLEFT" }, "text": "2, TableFormer outper-", "orig": "2, TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 264.63, "r_x1": 286.37, "r_y1": 264.63, "r_x2": 286.37, "r_y2": 255.72, "r_x3": 50.11, "r_y3": 255.72, "coord_origin": "TOPLEFT" }, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 276.59, "r_x1": 286.37, "r_y1": 276.59, "r_x2": 286.37, "r_y2": 267.68, "r_x3": 50.11, "r_y3": 267.68, "coord_origin": "TOPLEFT" }, "text": "margin for predicting the table structure from an image.", "orig": "margin for predicting the table structure from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 288.54, "r_x1": 286.37, "r_y1": 288.54, "r_x2": 286.37, "r_y2": 279.63, "r_x3": 50.11, "r_y3": 279.63, "coord_origin": "TOPLEFT" }, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.5, "r_x1": 286.37, "r_y1": 300.5, "r_x2": 286.37, "r_y2": 291.59, "r_x3": 50.11, "r_y3": 291.59, "coord_origin": "TOPLEFT" }, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.45, "r_x1": 286.37, "r_y1": 312.45, "r_x2": 286.37, "r_y2": 303.55, "r_x3": 50.11, "r_y3": 303.55, "coord_origin": "TOPLEFT" }, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 324.41, "r_x1": 286.37, "r_y1": 324.41, "r_x2": 286.37, "r_y2": 315.5, "r_x3": 50.11, "r_y3": 315.5, "coord_origin": "TOPLEFT" }, "text": "dataset. It has been observed that large tables (e.g. tables", "orig": "dataset. It has been observed that large tables (e.g. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 336.36, "r_x1": 286.37, "r_y1": 336.36, "r_x2": 286.37, "r_y2": 327.46, "r_x3": 50.11, "r_y3": 327.46, "coord_origin": "TOPLEFT" }, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 348.32, "r_x1": 286.37, "r_y1": 348.32, "r_x2": 286.37, "r_y2": 339.41, "r_x3": 50.11, "r_y3": 339.41, "coord_origin": "TOPLEFT" }, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 360.27, "r_x1": 286.37, "r_y1": 360.27, "r_x2": 286.37, "r_y2": 351.37, "r_x3": 50.11, "r_y3": 351.37, "coord_origin": "TOPLEFT" }, "text": "processing step, that produces downsampled images with", "orig": "processing step, that produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 372.23, "r_x1": 286.37, "r_y1": 372.23, "r_x2": 286.37, "r_y2": 363.32, "r_x3": 50.11, "r_y3": 363.32, "coord_origin": "TOPLEFT" }, "text": "indistinguishable features. This problem can be addressed", "orig": "indistinguishable features. This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 384.18, "r_x1": 286.37, "r_y1": 384.18, "r_x2": 286.37, "r_y2": 375.28, "r_x3": 50.11, "r_y3": 375.28, "coord_origin": "TOPLEFT" }, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 396.14, "r_x1": 170.01, "r_y1": 396.14, "r_x2": 170.01, "r_y2": 387.23, "r_x3": 50.11, "r_y3": 387.23, "coord_origin": "TOPLEFT" }, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size." }, { "label": "table", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "table", "bbox": { "l": 53.37, "t": 409.14, "r": 283.04, "b": 582.4, "coord_origin": "TOPLEFT" }, "confidence": 0.989, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 27, "label": "text", "bbox": { "l": 78.84, "t": 420.69, "r": 104.86, "b": 429.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.84, "r_y0": 429.6, "r_x1": 104.86, "r_y1": 429.6, "r_x2": 104.86, "r_y2": 420.69, "r_x3": 78.84, "r_y3": 420.69, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 211.2, "t": 414.71, "r": 236.11, "b": 423.62, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.2, "r_y0": 423.62, "r_x1": 236.11, "r_y1": 423.62, "r_x2": 236.11, "r_y2": 414.71, "r_x3": 211.2, "r_y3": 414.71, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 129.34, "t": 426.67, "r": 159.22, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 129.34, "r_y0": 435.57, "r_x1": 159.22, "r_y1": 435.57, "r_x2": 159.22, "r_y2": 426.67, "r_x3": 129.34, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 171.17, "t": 426.67, "r": 199.4, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.17, "r_y0": 435.57, "r_x1": 199.4, "r_y1": 435.57, "r_x2": 199.4, "r_y2": 426.67, "r_x3": 171.17, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 211.36, "t": 426.67, "r": 247.74, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.36, "r_y0": 435.57, "r_x1": 247.74, "r_y1": 435.57, "r_x2": 247.74, "r_y2": 426.67, "r_x3": 211.36, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 264.54, "t": 426.67, "r": 277.27, "b": 435.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.54, "r_y0": 435.57, "r_x1": 277.27, "r_y1": 435.57, "r_x2": 277.27, "r_y2": 426.67, "r_x3": 264.54, "r_y3": 426.67, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 81.61, "t": 443.62, "r": 102.09, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 452.53, "r_x1": 102.09, "r_y1": 452.53, "r_x2": 102.09, "r_y2": 443.62, "r_x3": 81.61, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 134.87, "t": 443.62, "r": 153.69, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 452.53, "r_x1": 153.69, "r_y1": 452.53, "r_x2": 153.69, "r_y2": 443.62, "r_x3": 134.87, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 176.57, "t": 443.62, "r": 194.0, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 452.53, "r_x1": 194.0, "r_y1": 452.53, "r_x2": 194.0, "r_y2": 443.62, "r_x3": 176.57, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 220.83, "t": 443.62, "r": 238.26, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 452.53, "r_x1": 238.26, "r_y1": 452.53, "r_x2": 238.26, "r_y2": 443.62, "r_x3": 220.83, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 262.18, "t": 443.62, "r": 279.62, "b": 452.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 452.53, "r_x1": 279.62, "r_y1": 452.53, "r_x2": 279.62, "r_y2": 443.62, "r_x3": 262.18, "r_y3": 443.62, "coord_origin": "TOPLEFT" }, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 82.17, "t": 455.58, "r": 101.53, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 464.49, "r_x1": 101.53, "r_y1": 464.49, "r_x2": 101.53, "r_y2": 455.58, "r_x3": 82.17, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 134.87, "t": 455.58, "r": 153.69, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 464.49, "r_x1": 153.69, "r_y1": 464.49, "r_x2": 153.69, "r_y2": 455.58, "r_x3": 134.87, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 183.62, "t": 455.58, "r": 186.94, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 464.49, "r_x1": 186.94, "r_y1": 464.49, "r_x2": 186.94, "r_y2": 455.58, "r_x3": 183.62, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 227.89, "t": 455.58, "r": 231.21, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 464.49, "r_x1": 231.21, "r_y1": 464.49, "r_x2": 231.21, "r_y2": 455.58, "r_x3": 227.89, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 259.7, "t": 455.58, "r": 282.11, "b": 464.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 464.49, "r_x1": 282.11, "r_y1": 464.49, "r_x2": 282.11, "r_y2": 455.58, "r_x3": 259.7, "r_y3": 455.58, "coord_origin": "TOPLEFT" }, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 66.32, "t": 468.13, "r": 117.38, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 477.04, "r_x1": 117.38, "r_y1": 477.04, "r_x2": 117.38, "r_y2": 468.13, "r_x3": 66.32, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 134.87, "t": 468.13, "r": 153.69, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 477.04, "r_x1": 153.69, "r_y1": 477.04, "r_x2": 153.69, "r_y2": 468.13, "r_x3": 134.87, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 176.57, "t": 468.13, "r": 194.01, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 477.04, "r_x1": 194.01, "r_y1": 477.04, "r_x2": 194.01, "r_y2": 468.13, "r_x3": 176.57, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 220.83, "t": 468.13, "r": 238.27, "b": 477.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 477.04, "r_x1": 238.27, "r_y1": 477.04, "r_x2": 238.27, "r_y2": 468.13, "r_x3": 220.83, "r_y3": 468.13, "coord_origin": "TOPLEFT" }, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 259.7, "t": 468.01, "r": 282.11, "b": 476.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 476.97, "r_x1": 282.11, "r_y1": 476.97, "r_x2": 282.11, "r_y2": 468.01, "r_x3": 259.7, "r_y3": 468.01, "coord_origin": "TOPLEFT" }, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 81.61, "t": 483.33, "r": 102.09, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 492.23, "r_x1": 102.09, "r_y1": 492.23, "r_x2": 102.09, "r_y2": 483.33, "r_x3": 81.61, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 134.87, "t": 483.33, "r": 153.69, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 492.23, "r_x1": 153.69, "r_y1": 492.23, "r_x2": 153.69, "r_y2": 483.33, "r_x3": 134.87, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 176.57, "t": 483.33, "r": 194.0, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 492.23, "r_x1": 194.0, "r_y1": 492.23, "r_x2": 194.0, "r_y2": 483.33, "r_x3": 176.57, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 218.34, "t": 483.33, "r": 240.75, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.34, "r_y0": 492.23, "r_x1": 240.75, "r_y1": 492.23, "r_x2": 240.75, "r_y2": 483.33, "r_x3": 218.34, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 262.18, "t": 483.33, "r": 279.62, "b": 492.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 492.23, "r_x1": 279.62, "r_y1": 492.23, "r_x2": 279.62, "r_y2": 483.33, "r_x3": 262.18, "r_y3": 483.33, "coord_origin": "TOPLEFT" }, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 82.17, "t": 495.28, "r": 101.53, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.17, "r_y0": 504.19, "r_x1": 101.53, "r_y1": 504.19, "r_x2": 101.53, "r_y2": 495.28, "r_x3": 82.17, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 134.87, "t": 495.28, "r": 153.69, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 504.19, "r_x1": 153.69, "r_y1": 504.19, "r_x2": 153.69, "r_y2": 495.28, "r_x3": 134.87, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 183.62, "t": 495.28, "r": 186.94, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.62, "r_y0": 504.19, "r_x1": 186.94, "r_y1": 504.19, "r_x2": 186.94, "r_y2": 495.28, "r_x3": 183.62, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 227.89, "t": 495.28, "r": 231.21, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 504.19, "r_x1": 231.21, "r_y1": 504.19, "r_x2": 231.21, "r_y2": 495.28, "r_x3": 227.89, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 259.7, "t": 495.28, "r": 282.11, "b": 504.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.7, "r_y0": 504.19, "r_x1": 282.11, "r_y1": 504.19, "r_x2": 282.11, "r_y2": 495.28, "r_x3": 259.7, "r_y3": 495.28, "coord_origin": "TOPLEFT" }, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 71.79, "t": 507.24, "r": 111.91, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.79, "r_y0": 516.14, "r_x1": 111.91, "r_y1": 516.14, "r_x2": 111.91, "r_y2": 507.24, "r_x3": 71.79, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 134.86, "t": 507.24, "r": 153.68, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.86, "r_y0": 516.14, "r_x1": 153.68, "r_y1": 516.14, "r_x2": 153.68, "r_y2": 507.24, "r_x3": 134.86, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.63, "t": 507.24, "r": 186.95, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.63, "r_y0": 516.14, "r_x1": 186.95, "r_y1": 516.14, "r_x2": 186.95, "r_y2": 507.24, "r_x3": 183.63, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 227.89, "t": 507.24, "r": 231.21, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 516.14, "r_x1": 231.21, "r_y1": 516.14, "r_x2": 231.21, "r_y2": 507.24, "r_x3": 227.89, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 259.69, "t": 507.24, "r": 282.11, "b": 516.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.69, "r_y0": 516.14, "r_x1": 282.11, "r_y1": 516.14, "r_x2": 282.11, "r_y2": 507.24, "r_x3": 259.69, "r_y3": 507.24, "coord_origin": "TOPLEFT" }, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 66.32, "t": 519.19, "r": 117.38, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 528.1, "r_x1": 117.38, "r_y1": 528.1, "r_x2": 117.38, "r_y2": 519.19, "r_x3": 66.32, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 134.87, "t": 519.19, "r": 153.69, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 528.1, "r_x1": 153.69, "r_y1": 528.1, "r_x2": 153.69, "r_y2": 519.19, "r_x3": 134.87, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 176.57, "t": 519.19, "r": 194.01, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 528.1, "r_x1": 194.01, "r_y1": 528.1, "r_x2": 194.01, "r_y2": 519.19, "r_x3": 176.57, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 220.83, "t": 519.19, "r": 238.27, "b": 528.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 528.1, "r_x1": 238.27, "r_y1": 528.1, "r_x2": 238.27, "r_y2": 519.19, "r_x3": 220.83, "r_y3": 519.19, "coord_origin": "TOPLEFT" }, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 262.19, "t": 519.07, "r": 279.62, "b": 528.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 528.03, "r_x1": 279.62, "r_y1": 528.03, "r_x2": 279.62, "r_y2": 519.07, "r_x3": 262.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 81.61, "t": 536.5, "r": 102.09, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.61, "r_y0": 545.4, "r_x1": 102.09, "r_y1": 545.4, "r_x2": 102.09, "r_y2": 536.5, "r_x3": 81.61, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 137.91, "t": 536.5, "r": 150.64, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 545.4, "r_x1": 150.64, "r_y1": 545.4, "r_x2": 150.64, "r_y2": 536.5, "r_x3": 137.91, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 176.57, "t": 536.5, "r": 194.0, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 545.4, "r_x1": 194.0, "r_y1": 545.4, "r_x2": 194.0, "r_y2": 536.5, "r_x3": 176.57, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 227.89, "t": 536.5, "r": 231.21, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 545.4, "r_x1": 231.21, "r_y1": 545.4, "r_x2": 231.21, "r_y2": 536.5, "r_x3": 227.89, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 262.18, "t": 536.5, "r": 279.62, "b": 545.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.18, "r_y0": 545.4, "r_x1": 279.62, "r_y1": 545.4, "r_x2": 279.62, "r_y2": 536.5, "r_x3": 262.18, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 66.32, "t": 548.45, "r": 117.38, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 557.36, "r_x1": 117.38, "r_y1": 557.36, "r_x2": 117.38, "r_y2": 548.45, "r_x3": 66.32, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 137.91, "t": 548.45, "r": 150.64, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 137.91, "r_y0": 557.36, "r_x1": 150.64, "r_y1": 557.36, "r_x2": 150.64, "r_y2": 548.45, "r_x3": 137.91, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 176.57, "t": 548.45, "r": 194.01, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 557.36, "r_x1": 194.01, "r_y1": 557.36, "r_x2": 194.01, "r_y2": 548.45, "r_x3": 176.57, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 227.89, "t": 548.45, "r": 231.21, "b": 557.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.89, "r_y0": 557.36, "r_x1": 231.21, "r_y1": 557.36, "r_x2": 231.21, "r_y2": 548.45, "r_x3": 227.89, "r_y3": 548.45, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 262.19, "t": 548.33, "r": 279.62, "b": 557.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 557.29, "r_x1": 279.62, "r_y1": 557.29, "r_x2": 279.62, "r_y2": 548.33, "r_x3": 262.19, "r_y3": 548.33, "coord_origin": "TOPLEFT" }, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 66.32, "t": 568.0, "r": 117.38, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.32, "r_y0": 576.91, "r_x1": 117.38, "r_y1": 576.91, "r_x2": 117.38, "r_y2": 568.0, "r_x3": 66.32, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 134.87, "t": 568.0, "r": 153.69, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.87, "r_y0": 576.91, "r_x1": 153.69, "r_y1": 576.91, "r_x2": 153.69, "r_y2": 568.0, "r_x3": 134.87, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 176.57, "t": 568.0, "r": 194.01, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.57, "r_y0": 576.91, "r_x1": 194.01, "r_y1": 576.91, "r_x2": 194.01, "r_y2": 568.0, "r_x3": 176.57, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 220.83, "t": 568.0, "r": 238.27, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.83, "r_y0": 576.91, "r_x1": 238.27, "r_y1": 576.91, "r_x2": 238.27, "r_y2": 568.0, "r_x3": 220.83, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 262.19, "t": 568.0, "r": 279.62, "b": 576.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.19, "r_y0": 576.91, "r_x1": 279.62, "r_y1": 576.91, "r_x2": 279.62, "r_y2": 568.0, "r_x3": 262.19, "r_y3": 568.0, "coord_origin": "TOPLEFT" }, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 11, "num_cols": 5, "table_cells": [ { "bbox": { "l": 78.84, "t": 420.69, "r": 104.86, "b": 429.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 211.2, "t": 414.71, "r": 236.11, "b": 423.62, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 129.34, "t": 426.67, "r": 159.22, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 171.17, "t": 426.67, "r": 199.4, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 264.54, "t": 426.67, "r": 277.27, "b": 435.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 443.62, "r": 102.09, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 443.62, "r": 153.69, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 443.62, "r": 194.0, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 443.62, "r": 238.26, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 443.62, "r": 279.62, "b": 452.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.17, "t": 455.58, "r": 101.53, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 455.58, "r": 153.69, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62, "t": 455.58, "r": 186.94, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 455.58, "r": 231.21, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 455.58, "r": 282.11, "b": 464.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 468.13, "r": 117.38, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 468.13, "r": 153.69, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 468.13, "r": 194.01, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 468.13, "r": 238.27, "b": 477.04, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 468.01, "r": 282.11, "b": 476.97, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 483.33, "r": 102.09, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 483.33, "r": 153.69, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 483.33, "r": 194.0, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 218.34, "t": 483.33, "r": 240.75, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 483.33, "r": 279.62, "b": 492.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 82.17, "t": 495.28, "r": 101.53, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 495.28, "r": 153.69, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.62, "t": 495.28, "r": 186.94, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 495.28, "r": 231.21, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.7, "t": 495.28, "r": 282.11, "b": 504.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 71.79, "t": 507.24, "r": 111.91, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.86, "t": 507.24, "r": 153.68, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 183.63, "t": 507.24, "r": 186.95, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 507.24, "r": 231.21, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 259.69, "t": 507.24, "r": 282.11, "b": 516.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 519.19, "r": 117.38, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 519.19, "r": 153.69, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 519.19, "r": 194.01, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 519.19, "r": 238.27, "b": 528.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 519.07, "r": 279.62, "b": 528.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 81.61, "t": 536.5, "r": 102.09, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91, "t": 536.5, "r": 150.64, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 536.5, "r": 194.0, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 536.5, "r": 231.21, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.18, "t": 536.5, "r": 279.62, "b": 545.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 548.45, "r": 117.38, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 137.91, "t": 548.45, "r": 150.64, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 548.45, "r": 194.01, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 227.89, "t": 548.45, "r": 231.21, "b": 557.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 548.33, "r": 279.62, "b": 557.29, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 66.32, "t": 568.0, "r": 117.38, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 134.87, "t": 568.0, "r": 153.69, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 176.57, "t": 568.0, "r": 194.01, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 220.83, "t": 568.0, "r": 238.27, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 262.19, "t": 568.0, "r": 279.62, "b": 576.91, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "text", "id": 15, "page_no": 6, "cluster": { "id": 15, "label": "text", "bbox": { "l": 50.11, "t": 592.43, "r": 286.37, "b": 613.29, "coord_origin": "TOPLEFT" }, "confidence": 0.721, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 601.34, "r_x1": 286.37, "r_y1": 601.34, "r_x2": 286.37, "r_y2": 592.43, "r_x3": 50.11, "r_y3": 592.43, "coord_origin": "TOPLEFT" }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 613.29, "r_x1": 247.46, "r_y1": 613.29, "r_x2": 247.46, "r_y2": 604.39, "r_x3": 50.11, "r_y3": 604.39, "coord_origin": "TOPLEFT" }, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)." }, { "label": "text", "id": 16, "page_no": 6, "cluster": { "id": 16, "label": "text", "bbox": { "l": 50.11, "t": 616.34, "r": 261.79, "b": 625.25, "coord_origin": "TOPLEFT" }, "confidence": 0.643, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 625.25, "r_x1": 261.79, "r_y1": 625.25, "r_x2": 261.79, "r_y2": 616.34, "r_x3": 50.11, "r_y3": 616.34, "coord_origin": "TOPLEFT" }, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "FT: Model was trained on PubTabNet then finetuned." }, { "label": "text", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 644.35, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 653.31, "r_x1": 124.72, "r_y1": 653.31, "r_x2": 124.72, "r_y2": 644.35, "r_x3": 62.07, "r_y3": 644.35, "coord_origin": "TOPLEFT" }, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 128.2, "r_y0": 653.38, "r_x1": 242.93, "r_y1": 653.38, "r_x2": 242.93, "r_y2": 644.47, "r_x3": 128.2, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.55, "r_y0": 653.15, "r_x1": 286.36, "r_y1": 653.15, "r_x2": 286.36, "r_y2": 644.56, "r_x3": 245.55, "r_y3": 644.56, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.1, "r_x1": 84.97, "r_y1": 665.1, "r_x2": 84.97, "r_y2": 656.51, "r_x3": 50.11, "r_y3": 656.51, "coord_origin": "TOPLEFT" }, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.52, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 89.52, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "provides bounding boxes that can be improved", "orig": "provides bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "grid-like structure of tables to refine the predictions. A de-", "orig": "grid-like structure of tables to refine the predictions. A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 286.37, "r_y1": 713.15, "r_x2": 286.37, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "supplementary material. As shown in Tab. 3, we evaluate", "orig": "supplementary material. As shown in Tab. 3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate" }, { "label": "text", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "text", "bbox": { "l": 308.86, "t": 75.21, "r": 545.12, "b": 227.58, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 84.11, "r_x1": 322.14, "r_y1": 84.11, "r_x2": 322.14, "r_y2": 75.21, "r_x3": 308.86, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.45, "r_y0": 83.89, "r_x1": 404.57, "r_y1": 83.89, "r_x2": 404.57, "r_y2": 75.3, "r_x3": 325.45, "r_y3": 75.3, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.1, "r_y0": 84.11, "r_x1": 545.11, "r_y1": 84.11, "r_x2": 545.11, "r_y2": 75.21, "r_x3": 408.1, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 96.07, "r_x1": 545.12, "r_y1": 96.07, "r_x2": 545.12, "r_y2": 87.16, "r_x3": 308.86, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 108.02, "r_x1": 470.23, "r_y1": 108.02, "r_x2": 470.23, "r_y2": 99.12, "r_x3": 308.86, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "for pre-processing and post-processing.", "orig": "for pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 477.53, "r_y0": 108.02, "r_x1": 545.12, "r_y1": 108.02, "r_x2": 545.12, "r_y2": 99.12, "r_x3": 477.53, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 119.98, "r_x1": 545.12, "r_y1": 119.98, "r_x2": 545.12, "r_y2": 111.07, "r_x3": 308.86, "r_y3": 111.07, "coord_origin": "TOPLEFT" }, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 131.93, "r_x1": 545.12, "r_y1": 131.93, "r_x2": 545.12, "r_y2": 123.03, "r_x3": 308.86, "r_y3": 123.03, "coord_origin": "TOPLEFT" }, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 143.89, "r_x1": 502.02, "r_y1": 143.89, "r_x2": 502.02, "r_y2": 134.98, "r_x3": 308.86, "r_y3": 134.98, "coord_origin": "TOPLEFT" }, "text": "posed approach, we\u2019ve integrated TableFormer\u2019s", "orig": "posed approach, we\u2019ve integrated TableFormer\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 504.47, "r_y0": 143.66, "r_x1": 545.11, "r_y1": 143.66, "r_x2": 545.11, "r_y2": 135.07, "r_x3": 504.47, "r_y3": 135.07, "coord_origin": "TOPLEFT" }, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 155.62, "r_x1": 343.16, "r_y1": 155.62, "r_x2": 343.16, "r_y2": 147.03, "r_x3": 308.86, "r_y3": 147.03, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.37, "r_y0": 155.85, "r_x1": 545.11, "r_y1": 155.85, "r_x2": 545.11, "r_y2": 146.94, "r_x3": 346.37, "r_y3": 146.94, "coord_origin": "TOPLEFT" }, "text": "into EDD architecture. As mentioned previously,", "orig": "into EDD architecture. As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 167.8, "r_x1": 446.16, "r_y1": 167.8, "r_x2": 446.16, "r_y2": 158.89, "r_x3": 308.86, "r_y3": 158.89, "coord_origin": "TOPLEFT" }, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.29, "r_y0": 167.57, "r_x1": 525.04, "r_y1": 167.57, "r_x2": 525.04, "r_y2": 158.98, "r_x3": 448.29, "r_y3": 158.98, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 527.4, "r_y0": 167.8, "r_x1": 545.11, "r_y1": 167.8, "r_x2": 545.11, "r_y2": 158.89, "r_x3": 527.4, "r_y3": 158.89, "coord_origin": "TOPLEFT" }, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 179.76, "r_x1": 545.12, "r_y1": 179.76, "r_x2": 545.12, "r_y2": 170.85, "r_x3": 308.86, "r_y3": 170.85, "coord_origin": "TOPLEFT" }, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 191.71, "r_x1": 432.87, "r_y1": 191.71, "r_x2": 432.87, "r_y2": 182.8, "r_x3": 308.86, "r_y3": 182.8, "coord_origin": "TOPLEFT" }, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.39, "r_y0": 191.48, "r_x1": 510.93, "r_y1": 191.48, "r_x2": 510.93, "r_y2": 182.89, "r_x3": 436.39, "r_y3": 182.89, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.68, "r_y0": 191.71, "r_x1": 545.11, "r_y1": 191.71, "r_x2": 545.11, "r_y2": 182.8, "r_x3": 514.68, "r_y3": 182.8, "coord_origin": "TOPLEFT" }, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 203.67, "r_x1": 431.17, "r_y1": 203.67, "r_x2": 431.17, "r_y2": 194.76, "r_x3": 308.86, "r_y3": 194.76, "coord_origin": "TOPLEFT" }, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.68, "r_y0": 203.44, "r_x1": 514.18, "r_y1": 203.44, "r_x2": 514.18, "r_y2": 194.85, "r_x3": 434.68, "r_y3": 194.85, "coord_origin": "TOPLEFT" }, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.18, "r_y0": 203.67, "r_x1": 545.11, "r_y1": 203.67, "r_x2": 545.11, "r_y2": 194.76, "r_x3": 514.18, "r_y3": 194.76, "coord_origin": "TOPLEFT" }, "text": ". If the", "orig": ". If the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 215.39, "r_x1": 382.36, "r_y1": 215.39, "r_x2": 382.36, "r_y2": 206.81, "r_x3": 308.86, "r_y3": 206.81, "coord_origin": "TOPLEFT" }, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.08, "r_y0": 215.62, "r_x1": 545.11, "r_y1": 215.62, "r_x2": 545.11, "r_y2": 206.72, "r_x3": 385.08, "r_y3": 206.72, "coord_origin": "TOPLEFT" }, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 227.58, "r_x1": 501.7, "r_y1": 227.58, "r_x2": 501.7, "r_y2": 218.67, "r_x3": 308.86, "r_y3": 218.67, "coord_origin": "TOPLEFT" }, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes." }, { "label": "table", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "table", "bbox": { "l": 308.41, "t": 247.88, "r": 533.64, "b": 303.81, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 83, "label": "text", "bbox": { "l": 339.32, "t": 253.66, "r": 365.34, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.32, "r_y0": 262.57, "r_x1": 365.34, "r_y1": 262.57, "r_x2": 365.34, "r_y2": 253.66, "r_x3": 339.32, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 401.04, "t": 253.66, "r": 430.92, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 401.04, "r_y0": 262.57, "r_x1": 430.92, "r_y1": 262.57, "r_x2": 430.92, "r_y2": 253.66, "r_x3": 401.04, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 454.1, "t": 253.66, "r": 474.59, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.1, "r_y0": 262.57, "r_x1": 474.59, "r_y1": 262.57, "r_x2": 474.59, "r_y2": 253.66, "r_x3": 454.1, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 486.54, "t": 253.66, "r": 527.23, "b": 262.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 486.54, "r_y0": 262.57, "r_x1": 527.23, "r_y1": 262.57, "r_x2": 527.23, "r_y2": 253.66, "r_x3": 486.54, "r_y3": 253.66, "coord_origin": "TOPLEFT" }, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 327.66, "t": 270.62, "r": 377.0, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.66, "r_y0": 279.53, "r_x1": 377.0, "r_y1": 279.53, "r_x2": 377.0, "r_y2": 270.62, "r_x3": 327.66, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 393.7, "t": 270.62, "r": 438.28, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.7, "r_y0": 279.53, "r_x1": 438.28, "r_y1": 279.53, "r_x2": 438.28, "r_y2": 270.62, "r_x3": 393.7, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 455.64, "t": 270.62, "r": 473.07, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.64, "r_y0": 279.53, "r_x1": 473.07, "r_y1": 279.53, "r_x2": 473.07, "r_y2": 270.62, "r_x3": 455.64, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 498.17, "t": 270.62, "r": 515.6, "b": 279.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 279.53, "r_x1": 515.6, "r_y1": 279.53, "r_x2": 515.6, "r_y2": 270.62, "r_x3": 498.17, "r_y3": 270.62, "coord_origin": "TOPLEFT" }, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.8, "t": 282.58, "r": 377.86, "b": 291.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 291.48, "r_x1": 377.86, "r_y1": 291.48, "r_x2": 377.86, "r_y2": 282.58, "r_x3": 326.8, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 393.69, "t": 282.58, "r": 438.28, "b": 291.48, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.69, "r_y0": 291.48, "r_x1": 438.28, "r_y1": 291.48, "r_x2": 438.28, "r_y2": 282.58, "r_x3": 393.69, "r_y3": 282.58, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 455.63, "t": 282.46, "r": 473.07, "b": 291.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 291.41, "r_x1": 473.07, "r_y1": 291.41, "r_x2": 473.07, "r_y2": 282.46, "r_x3": 455.63, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 498.17, "t": 282.46, "r": 515.61, "b": 291.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 498.17, "r_y0": 291.41, "r_x1": 515.61, "r_y1": 291.41, "r_x2": 515.61, "r_y2": 282.46, "r_x3": 498.17, "r_y3": 282.46, "coord_origin": "TOPLEFT" }, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 326.8, "t": 294.53, "r": 377.86, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 303.44, "r_x1": 377.86, "r_y1": 303.44, "r_x2": 377.86, "r_y2": 294.53, "r_x3": 326.8, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 389.82, "t": 294.53, "r": 442.15, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 389.82, "r_y0": 303.44, "r_x1": 442.15, "r_y1": 303.44, "r_x2": 442.15, "r_y2": 294.53, "r_x3": 389.82, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 455.63, "t": 294.53, "r": 473.07, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.63, "r_y0": 303.44, "r_x1": 473.07, "r_y1": 303.44, "r_x2": 473.07, "r_y2": 294.53, "r_x3": 455.63, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 505.23, "t": 294.53, "r": 508.54, "b": 303.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 505.23, "r_y0": 303.44, "r_x1": 508.54, "r_y1": 303.44, "r_x2": 508.54, "r_y2": 294.53, "r_x3": 505.23, "r_y3": 294.53, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 4, "num_cols": 4, "table_cells": [ { "bbox": { "l": 339.32, "t": 253.66, "r": 365.34, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 401.04, "t": 253.66, "r": 430.92, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 454.1, "t": 253.66, "r": 474.59, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 486.54, "t": 253.66, "r": 527.23, "b": 262.57, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 327.66, "t": 270.62, "r": 377.0, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.7, "t": 270.62, "r": 438.28, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.64, "t": 270.62, "r": 473.07, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.17, "t": 270.62, "r": 515.6, "b": 279.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.8, "t": 282.58, "r": 377.86, "b": 291.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 393.69, "t": 282.58, "r": 438.28, "b": 291.48, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63, "t": 282.46, "r": 473.07, "b": 291.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 498.17, "t": 282.46, "r": 515.61, "b": 291.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.8, "t": 294.53, "r": 377.86, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 389.82, "t": 294.53, "r": 442.15, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 455.63, "t": 294.53, "r": 473.07, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 505.23, "t": 294.53, "r": 508.54, "b": 303.44, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "caption", "bbox": { "l": 308.86, "t": 316.45, "r": 545.12, "b": 337.31, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 325.36, "r_x1": 341.5, "r_y1": 325.36, "r_x2": 341.5, "r_y2": 316.45, "r_x3": 308.86, "r_y3": 316.45, "coord_origin": "TOPLEFT" }, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 348.6, "r_y0": 325.36, "r_x1": 545.12, "r_y1": 325.36, "r_x2": 545.12, "r_y2": 316.45, "r_x3": 348.6, "r_y3": 316.45, "coord_origin": "TOPLEFT" }, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 337.31, "r_x1": 474.98, "r_y1": 337.31, "r_x2": 474.98, "r_y2": 328.4, "r_x3": 308.86, "r_y3": 328.4, "coord_origin": "TOPLEFT" }, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing." }, { "label": "text", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "text", "bbox": { "l": 308.86, "t": 367.68, "r": 545.12, "b": 520.17, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 376.64, "r_x1": 378.95, "r_y1": 376.64, "r_x2": 378.95, "r_y2": 367.68, "r_x3": 320.82, "r_y3": 367.68, "coord_origin": "TOPLEFT" }, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.08, "r_y0": 376.71, "r_x1": 545.12, "r_y1": 376.71, "r_x2": 545.12, "r_y2": 367.8, "r_x3": 387.08, "r_y3": 367.8, "coord_origin": "TOPLEFT" }, "text": "In this section, we evaluate the entire", "orig": "In this section, we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 388.66, "r_x1": 487.19, "r_y1": 388.66, "r_x2": 487.19, "r_y2": 379.75, "r_x3": 308.86, "r_y3": 379.75, "coord_origin": "TOPLEFT" }, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.97, "r_y0": 388.66, "r_x1": 545.12, "r_y1": 388.66, "r_x2": 545.12, "r_y2": 379.75, "r_x3": 493.97, "r_y3": 379.75, "coord_origin": "TOPLEFT" }, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.62, "r_x1": 545.12, "r_y1": 400.62, "r_x2": 545.12, "r_y2": 391.71, "r_x3": 308.86, "r_y3": 391.71, "coord_origin": "TOPLEFT" }, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.57, "r_x1": 545.12, "r_y1": 412.57, "r_x2": 545.12, "r_y2": 403.67, "r_x3": 308.86, "r_y3": 403.67, "coord_origin": "TOPLEFT" }, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.53, "r_x1": 314.08, "r_y1": 424.53, "r_x2": 314.08, "r_y2": 415.62, "r_x3": 308.86, "r_y3": 415.62, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.69, "r_y0": 424.53, "r_x1": 545.12, "r_y1": 424.53, "r_x2": 545.12, "r_y2": 415.62, "r_x3": 316.69, "r_y3": 415.62, "coord_origin": "TOPLEFT" }, "text": "shows the TEDs score of HTML code representing the", "orig": "shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.48, "r_x1": 545.12, "r_y1": 436.48, "r_x2": 545.12, "r_y2": 427.58, "r_x3": 308.86, "r_y3": 427.58, "coord_origin": "TOPLEFT" }, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.44, "r_x1": 545.12, "r_y1": 448.44, "r_x2": 545.12, "r_y2": 439.53, "r_x3": 308.86, "r_y3": 439.53, "coord_origin": "TOPLEFT" }, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 460.39, "r_x1": 350.24, "r_y1": 460.39, "r_x2": 350.24, "r_y2": 451.49, "r_x3": 308.86, "r_y3": 451.49, "coord_origin": "TOPLEFT" }, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.18, "r_y0": 460.32, "r_x1": 374.59, "r_y1": 460.32, "r_x2": 374.59, "r_y2": 451.37, "r_x3": 352.18, "r_y3": 451.37, "coord_origin": "TOPLEFT" }, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.53, "r_y0": 460.39, "r_x1": 545.11, "r_y1": 460.39, "r_x2": 545.11, "r_y2": 451.49, "r_x3": 376.53, "r_y3": 451.49, "coord_origin": "TOPLEFT" }, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 472.35, "r_x1": 545.12, "r_y1": 472.35, "r_x2": 545.12, "r_y2": 463.44, "r_x3": 308.86, "r_y3": 463.44, "coord_origin": "TOPLEFT" }, "text": "mercial solutions. We believe our scores would be higher", "orig": "mercial solutions. We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 484.3, "r_x1": 545.12, "r_y1": 484.3, "r_x2": 545.12, "r_y2": 475.4, "r_x3": 308.86, "r_y3": 475.4, "coord_origin": "TOPLEFT" }, "text": "if the HTML ground-truth matched the extracted PDF cell", "orig": "if the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 496.26, "r_x1": 545.12, "r_y1": 496.26, "r_x2": 545.12, "r_y2": 487.35, "r_x3": 308.86, "r_y3": 487.35, "coord_origin": "TOPLEFT" }, "text": "content. Unfortunately, there are small discrepancies such", "orig": "content. Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 508.21, "r_x1": 545.12, "r_y1": 508.21, "r_x2": 545.12, "r_y2": 499.31, "r_x3": 308.86, "r_y3": 499.31, "coord_origin": "TOPLEFT" }, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 520.17, "r_x1": 405.7, "r_y1": 520.17, "r_x2": 405.7, "r_y2": 511.26, "r_x3": 308.86, "r_y3": 511.26, "coord_origin": "TOPLEFT" }, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations." }, { "label": "table", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "table", "bbox": { "l": 332.97, "t": 540.28, "r": 520.94, "b": 643.27, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 99, "label": "text", "bbox": { "l": 358.01, "t": 552.23, "r": 384.02, "b": 561.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 358.01, "r_y0": 561.14, "r_x1": 384.02, "r_y1": 561.14, "r_x2": 384.02, "r_y2": 552.23, "r_x3": 358.01, "r_y3": 552.23, "coord_origin": "TOPLEFT" }, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 449.03, "t": 546.26, "r": 473.94, "b": 555.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 449.03, "r_y0": 555.16, "r_x1": 473.94, "r_y1": 555.16, "r_x2": 473.94, "r_y2": 546.26, "r_x3": 449.03, "r_y3": 546.26, "coord_origin": "TOPLEFT" }, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 408.51, "t": 558.21, "r": 436.74, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.51, "r_y0": 567.12, "r_x1": 436.74, "r_y1": 567.12, "r_x2": 436.74, "r_y2": 558.21, "r_x3": 408.51, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 448.7, "t": 558.21, "r": 485.08, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.7, "r_y0": 567.12, "r_x1": 485.08, "r_y1": 567.12, "r_x2": 485.08, "r_y2": 558.21, "r_x3": 448.7, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 499.38, "t": 558.21, "r": 512.12, "b": 567.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 499.38, "r_y0": 567.12, "r_x1": 512.12, "r_y1": 567.12, "r_x2": 512.12, "r_y2": 558.21, "r_x3": 499.38, "r_y3": 558.21, "coord_origin": "TOPLEFT" }, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 357.68, "t": 575.17, "r": 384.35, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.68, "r_y0": 584.07, "r_x1": 384.35, "r_y1": 584.07, "r_x2": 384.35, "r_y2": 575.17, "r_x3": 357.68, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 413.9, "t": 575.17, "r": 431.34, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 584.07, "r_x1": 431.34, "r_y1": 584.07, "r_x2": 431.34, "r_y2": 575.17, "r_x3": 413.9, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 458.16, "t": 575.17, "r": 475.6, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.16, "r_y0": 584.07, "r_x1": 475.6, "r_y1": 584.07, "r_x2": 475.6, "r_y2": 575.17, "r_x3": 458.16, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 497.03, "t": 575.17, "r": 514.46, "b": 584.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 584.07, "r_x1": 514.46, "r_y1": 584.07, "r_x2": 514.46, "r_y2": 575.17, "r_x3": 497.03, "r_y3": 575.17, "coord_origin": "TOPLEFT" }, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 350.72, "t": 587.12, "r": 391.31, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 350.72, "r_y0": 596.03, "r_x1": 391.31, "r_y1": 596.03, "r_x2": 391.31, "r_y2": 587.12, "r_x3": 350.72, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 413.91, "t": 587.12, "r": 431.34, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 596.03, "r_x1": 431.34, "r_y1": 596.03, "r_x2": 431.34, "r_y2": 587.12, "r_x3": 413.91, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 458.17, "t": 587.12, "r": 475.6, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 596.03, "r_x1": 475.6, "r_y1": 596.03, "r_x2": 475.6, "r_y2": 587.12, "r_x3": 458.17, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 497.03, "t": 587.12, "r": 514.47, "b": 596.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 596.03, "r_x1": 514.47, "r_y1": 596.03, "r_x2": 514.47, "r_y2": 587.12, "r_x3": 497.03, "r_y3": 587.12, "coord_origin": "TOPLEFT" }, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 354.14, "t": 599.08, "r": 387.9, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 354.14, "r_y0": 607.98, "r_x1": 387.9, "r_y1": 607.98, "r_x2": 387.9, "r_y2": 599.08, "r_x3": 354.14, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 413.9, "t": 599.08, "r": 431.34, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 607.98, "r_x1": 431.34, "r_y1": 607.98, "r_x2": 431.34, "r_y2": 599.08, "r_x3": 413.9, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 458.17, "t": 599.08, "r": 475.6, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 607.98, "r_x1": 475.6, "r_y1": 607.98, "r_x2": 475.6, "r_y2": 599.08, "r_x3": 458.17, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 497.03, "t": 599.08, "r": 514.46, "b": 607.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 607.98, "r_x1": 514.46, "r_y1": 607.98, "r_x2": 514.46, "r_y2": 599.08, "r_x3": 497.03, "r_y3": 599.08, "coord_origin": "TOPLEFT" }, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 346.56, "t": 611.03, "r": 395.48, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.56, "r_y0": 619.94, "r_x1": 395.48, "r_y1": 619.94, "r_x2": 395.48, "r_y2": 611.03, "r_x3": 346.56, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 413.91, "t": 611.03, "r": 431.34, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 619.94, "r_x1": 431.34, "r_y1": 619.94, "r_x2": 431.34, "r_y2": 611.03, "r_x3": 413.91, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 458.17, "t": 611.03, "r": 475.6, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 619.94, "r_x1": 475.6, "r_y1": 619.94, "r_x2": 475.6, "r_y2": 611.03, "r_x3": 458.17, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 497.03, "t": 611.03, "r": 514.47, "b": 619.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 619.94, "r_x1": 514.47, "r_y1": 619.94, "r_x2": 514.47, "r_y2": 611.03, "r_x3": 497.03, "r_y3": 611.03, "coord_origin": "TOPLEFT" }, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 360.78, "t": 622.99, "r": 381.25, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.78, "r_y0": 631.89, "r_x1": 381.25, "r_y1": 631.89, "r_x2": 381.25, "r_y2": 622.99, "r_x3": 360.78, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 413.9, "t": 622.99, "r": 431.34, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.9, "r_y0": 631.89, "r_x1": 431.34, "r_y1": 631.89, "r_x2": 431.34, "r_y2": 622.99, "r_x3": 413.9, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 458.17, "t": 622.99, "r": 475.6, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 631.89, "r_x1": 475.6, "r_y1": 631.89, "r_x2": 475.6, "r_y2": 622.99, "r_x3": 458.17, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 497.03, "t": 622.99, "r": 514.46, "b": 631.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 631.89, "r_x1": 514.46, "r_y1": 631.89, "r_x2": 514.46, "r_y2": 622.99, "r_x3": 497.03, "r_y3": 622.99, "coord_origin": "TOPLEFT" }, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 345.48, "t": 634.94, "r": 396.55, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.48, "r_y0": 643.85, "r_x1": 396.55, "r_y1": 643.85, "r_x2": 396.55, "r_y2": 634.94, "r_x3": 345.48, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 413.91, "t": 634.94, "r": 431.34, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 413.91, "r_y0": 643.85, "r_x1": 431.34, "r_y1": 643.85, "r_x2": 431.34, "r_y2": 634.94, "r_x3": 413.91, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 458.17, "t": 634.94, "r": 475.6, "b": 643.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 458.17, "r_y0": 643.85, "r_x1": 475.6, "r_y1": 643.85, "r_x2": 475.6, "r_y2": 634.94, "r_x3": 458.17, "r_y3": 634.94, "coord_origin": "TOPLEFT" }, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 497.03, "t": 634.82, "r": 514.47, "b": 643.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 497.03, "r_y0": 643.78, "r_x1": 514.47, "r_y1": 643.78, "r_x2": 514.47, "r_y2": 634.82, "r_x3": 497.03, "r_y3": 634.82, "coord_origin": "TOPLEFT" }, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 4, "table_cells": [ { "bbox": { "l": 358.01, "t": 552.23, "r": 384.02, "b": 561.14, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 449.03, "t": 546.26, "r": 473.94, "b": 555.16, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 408.51, "t": 558.21, "r": 436.74, "b": 567.12, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 499.38, "t": 558.21, "r": 512.12, "b": 567.12, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 357.68, "t": 575.17, "r": 384.35, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 575.17, "r": 431.34, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.16, "t": 575.17, "r": 475.6, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 575.17, "r": 514.46, "b": 584.07, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 350.72, "t": 587.12, "r": 391.31, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 587.12, "r": 431.34, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 587.12, "r": 475.6, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 587.12, "r": 514.47, "b": 596.03, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 354.14, "t": 599.08, "r": 387.9, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 599.08, "r": 431.34, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 599.08, "r": 475.6, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 599.08, "r": 514.46, "b": 607.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 346.56, "t": 611.03, "r": 395.48, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 611.03, "r": 431.34, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 611.03, "r": 475.6, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 611.03, "r": 514.47, "b": 619.94, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 360.78, "t": 622.99, "r": 381.25, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.9, "t": 622.99, "r": 431.34, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 622.99, "r": 475.6, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 622.99, "r": 514.46, "b": 631.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 345.48, "t": 634.94, "r": 396.55, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 413.91, "t": 634.94, "r": 431.34, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 458.17, "t": 634.94, "r": 475.6, "b": 643.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 497.03, "t": 634.82, "r": 514.47, "b": 643.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "caption", "bbox": { "l": 308.86, "t": 656.86, "r": 545.12, "b": 689.68, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 665.77, "r_x1": 341.74, "r_y1": 665.77, "r_x2": 341.74, "r_y2": 656.86, "r_x3": 308.86, "r_y3": 656.86, "coord_origin": "TOPLEFT" }, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 349.56, "r_y0": 665.77, "r_x1": 545.12, "r_y1": 665.77, "r_x2": 545.12, "r_y2": 656.86, "r_x3": 349.56, "r_y3": 656.86, "coord_origin": "TOPLEFT" }, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 677.72, "r_x1": 545.12, "r_y1": 677.72, "r_x2": 545.12, "r_y2": 668.82, "r_x3": 308.86, "r_y3": 668.82, "coord_origin": "TOPLEFT" }, "text": "cell detection on PubTabNet. In all cases the input is PDF", "orig": "cell detection on PubTabNet. In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 689.68, "r_x1": 435.04, "r_y1": 689.68, "r_x2": 435.04, "r_y2": 680.77, "r_x3": 308.86, "r_y3": 680.77, "coord_origin": "TOPLEFT" }, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables." } ], "headers": [ { "label": "page_footer", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.879, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" } ] } }, { "page_no": 7, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.81, "r_y0": 216.11, "r_x1": 62.22, "r_y1": 216.11, "r_x2": 62.22, "r_y2": 208.23, "r_x3": 53.81, "r_y3": 208.23, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.42, "r_y0": 216.11, "r_x1": 385.93, "r_y1": 216.11, "r_x2": 385.93, "r_y2": 208.23, "r_x3": 66.42, "r_y3": 208.23, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.81, "r_y0": 102.15, "r_x1": 284.35, "r_y1": 102.15, "r_x2": 284.35, "r_y2": 94.28, "r_x3": 53.81, "r_y3": 94.28, "coord_origin": "TOPLEFT" }, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 304.83, "r_y0": 102.15, "r_x1": 431.09, "r_y1": 102.15, "r_x2": 431.09, "r_y2": 94.28, "r_x3": 304.83, "r_y3": 94.28, "coord_origin": "TOPLEFT" }, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.29, "r_y0": 86.56, "r_x1": 61.55, "r_y1": 86.56, "r_x2": 61.55, "r_y2": 78.69, "r_x3": 53.29, "r_y3": 78.69, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.68, "r_y0": 86.56, "r_x1": 499.56, "r_y1": 86.56, "r_x2": 499.56, "r_y2": 78.69, "r_x3": 65.68, "r_y3": 78.69, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.43, "r_y0": 298.6, "r_x1": 549.42, "r_y1": 298.6, "r_x2": 549.42, "r_y2": 292.3, "r_x3": 380.43, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 329.78, "r_x1": 86.86, "r_y1": 329.78, "r_x2": 86.86, "r_y2": 320.88, "r_x3": 50.11, "r_y3": 320.88, "coord_origin": "TOPLEFT" }, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.92, "r_y0": 329.78, "r_x1": 545.11, "r_y1": 329.78, "r_x2": 545.11, "r_y2": 320.88, "r_x3": 93.92, "r_y3": 320.88, "coord_origin": "TOPLEFT" }, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 341.74, "r_x1": 545.11, "r_y1": 341.74, "r_x2": 545.11, "r_y2": 332.83, "r_x3": 50.11, "r_y3": 332.83, "coord_origin": "TOPLEFT" }, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 353.69, "r_x1": 545.11, "r_y1": 353.69, "r_x2": 545.11, "r_y2": 344.79, "r_x3": 50.11, "r_y3": 344.79, "coord_origin": "TOPLEFT" }, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 365.65, "r_x1": 139.8, "r_y1": 365.65, "r_x2": 139.8, "r_y2": 356.74, "r_x3": 50.11, "r_y3": 356.74, "coord_origin": "TOPLEFT" }, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26, "r_y0": 386.44, "r_x1": 342.08, "r_y1": 386.44, "r_x2": 342.08, "r_y2": 381.78, "r_x3": 220.26, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.72, "r_y0": 386.44, "r_x1": 85.66, "r_y1": 386.44, "r_x2": 85.66, "r_y2": 381.78, "r_x3": 53.72, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 406.87, "r_x1": 443.7, "r_y1": 406.87, "r_x2": 443.7, "r_y2": 400.55, "r_x3": 437.38, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 406.87, "r_x1": 456.65, "r_y1": 406.87, "r_x2": 456.65, "r_y2": 400.55, "r_x3": 450.33, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 406.87, "r_x1": 469.6, "r_y1": 406.87, "r_x2": 469.6, "r_y2": 400.55, "r_x3": 463.28, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 406.87, "r_x1": 482.56, "r_y1": 406.87, "r_x2": 482.56, "r_y2": 400.55, "r_x3": 476.24, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 406.87, "r_x1": 495.51, "r_y1": 406.87, "r_x2": 495.51, "r_y2": 400.55, "r_x3": 489.19, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 406.87, "r_x1": 508.46, "r_y1": 406.87, "r_x2": 508.46, "r_y2": 400.55, "r_x3": 502.14, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 406.87, "r_x1": 521.41, "r_y1": 406.87, "r_x2": 521.41, "r_y2": 400.55, "r_x3": 515.1, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 417.36, "r_x1": 391.6, "r_y1": 417.36, "r_x2": 391.6, "r_y2": 411.04, "r_x3": 385.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 417.36, "r_x1": 404.84, "r_y1": 417.36, "r_x2": 404.84, "r_y2": 411.04, "r_x3": 398.52, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 417.36, "r_x1": 417.8, "r_y1": 417.36, "r_x2": 417.8, "r_y2": 411.04, "r_x3": 411.48, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 417.36, "r_x1": 443.7, "r_y1": 417.36, "r_x2": 443.7, "r_y2": 411.04, "r_x3": 437.38, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 417.36, "r_x1": 456.65, "r_y1": 417.36, "r_x2": 456.65, "r_y2": 411.04, "r_x3": 450.33, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 417.36, "r_x1": 469.6, "r_y1": 417.36, "r_x2": 469.6, "r_y2": 411.04, "r_x3": 463.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 427.39, "r_x1": 391.6, "r_y1": 427.39, "r_x2": 391.6, "r_y2": 421.07, "r_x3": 385.28, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 427.39, "r_x1": 404.84, "r_y1": 427.39, "r_x2": 404.84, "r_y2": 421.07, "r_x3": 398.52, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 427.39, "r_x1": 417.8, "r_y1": 427.39, "r_x2": 417.8, "r_y2": 421.07, "r_x3": 411.48, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 427.39, "r_x1": 430.75, "r_y1": 427.39, "r_x2": 430.75, "r_y2": 421.07, "r_x3": 424.43, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 427.39, "r_x1": 443.7, "r_y1": 427.39, "r_x2": 443.7, "r_y2": 421.07, "r_x3": 437.38, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 427.39, "r_x1": 456.65, "r_y1": 427.39, "r_x2": 456.65, "r_y2": 421.07, "r_x3": 450.33, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 427.39, "r_x1": 469.61, "r_y1": 427.39, "r_x2": 469.61, "r_y2": 421.07, "r_x3": 463.29, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 427.39, "r_x1": 482.56, "r_y1": 427.39, "r_x2": 482.56, "r_y2": 421.07, "r_x3": 476.24, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 427.39, "r_x1": 495.51, "r_y1": 427.39, "r_x2": 495.51, "r_y2": 421.07, "r_x3": 489.19, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 427.39, "r_x1": 508.46, "r_y1": 427.39, "r_x2": 508.46, "r_y2": 421.07, "r_x3": 502.14, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 427.39, "r_x1": 521.42, "r_y1": 427.39, "r_x2": 521.42, "r_y2": 421.07, "r_x3": 515.1, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 427.39, "r_x1": 534.37, "r_y1": 427.39, "r_x2": 534.37, "r_y2": 421.07, "r_x3": 528.05, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 438.36, "r_x1": 391.6, "r_y1": 438.36, "r_x2": 391.6, "r_y2": 432.04, "r_x3": 385.28, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 438.36, "r_x1": 404.84, "r_y1": 438.36, "r_x2": 404.84, "r_y2": 432.04, "r_x3": 398.52, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 438.36, "r_x1": 417.8, "r_y1": 438.36, "r_x2": 417.8, "r_y2": 432.04, "r_x3": 411.48, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 438.36, "r_x1": 430.75, "r_y1": 438.36, "r_x2": 430.75, "r_y2": 432.04, "r_x3": 424.43, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 438.36, "r_x1": 443.7, "r_y1": 438.36, "r_x2": 443.7, "r_y2": 432.04, "r_x3": 437.38, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 438.36, "r_x1": 456.65, "r_y1": 438.36, "r_x2": 456.65, "r_y2": 432.04, "r_x3": 450.33, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 438.36, "r_x1": 469.61, "r_y1": 438.36, "r_x2": 469.61, "r_y2": 432.04, "r_x3": 463.29, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 438.36, "r_x1": 482.56, "r_y1": 438.36, "r_x2": 482.56, "r_y2": 432.04, "r_x3": 476.24, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 438.36, "r_x1": 495.51, "r_y1": 438.36, "r_x2": 495.51, "r_y2": 432.04, "r_x3": 489.19, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 438.36, "r_x1": 508.46, "r_y1": 438.36, "r_x2": 508.46, "r_y2": 432.04, "r_x3": 502.14, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 438.36, "r_x1": 521.42, "r_y1": 438.36, "r_x2": 521.42, "r_y2": 432.04, "r_x3": 515.1, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 438.36, "r_x1": 534.37, "r_y1": 438.36, "r_x2": 534.37, "r_y2": 432.04, "r_x3": 528.05, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 395.52, "r_x1": 388.44, "r_y1": 395.52, "r_x2": 388.44, "r_y2": 389.2, "r_x3": 385.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 395.52, "r_x1": 401.68, "r_y1": 395.52, "r_x2": 401.68, "r_y2": 389.2, "r_x3": 398.52, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 395.52, "r_x1": 414.63, "r_y1": 395.52, "r_x2": 414.63, "r_y2": 389.2, "r_x3": 411.48, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 395.52, "r_x1": 427.59, "r_y1": 395.52, "r_x2": 427.59, "r_y2": 389.2, "r_x3": 424.43, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 395.52, "r_x1": 440.54, "r_y1": 395.52, "r_x2": 440.54, "r_y2": 389.2, "r_x3": 437.38, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 395.52, "r_x1": 453.49, "r_y1": 395.52, "r_x2": 453.49, "r_y2": 389.2, "r_x3": 450.33, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 395.52, "r_x1": 466.44, "r_y1": 395.52, "r_x2": 466.44, "r_y2": 389.2, "r_x3": 463.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 395.52, "r_x1": 479.39, "r_y1": 395.52, "r_x2": 479.39, "r_y2": 389.2, "r_x3": 476.24, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 395.52, "r_x1": 492.35, "r_y1": 395.52, "r_x2": 492.35, "r_y2": 389.2, "r_x3": 489.19, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 395.52, "r_x1": 505.3, "r_y1": 395.52, "r_x2": 505.3, "r_y2": 389.2, "r_x3": 502.14, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09, "r_y0": 395.52, "r_x1": 521.41, "r_y1": 395.52, "r_x2": 521.41, "r_y2": 389.2, "r_x3": 515.09, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04, "r_y0": 395.52, "r_x1": 534.13, "r_y1": 395.52, "r_x2": 534.13, "r_y2": 389.2, "r_x3": 528.04, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 405.29, "r_x1": 391.6, "r_y1": 405.29, "r_x2": 391.6, "r_y2": 398.97, "r_x3": 385.28, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 405.29, "r_x1": 404.84, "r_y1": 405.29, "r_x2": 404.84, "r_y2": 398.97, "r_x3": 398.52, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 405.29, "r_x1": 417.8, "r_y1": 405.29, "r_x2": 417.8, "r_y2": 398.97, "r_x3": 411.48, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 413.09, "r_x1": 430.75, "r_y1": 413.09, "r_x2": 430.75, "r_y2": 406.77, "r_x3": 424.43, "r_y3": 406.77, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.87, "r_y0": 417.31, "r_x1": 509.19, "r_y1": 417.31, "r_x2": 509.19, "r_y2": 410.99, "r_x3": 502.87, "r_y3": 410.99, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35, "r_y0": 386.44, "r_x1": 430.99, "r_y1": 386.44, "r_x2": 430.99, "r_y2": 381.78, "r_x3": 384.35, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.6, "r_y0": 467.63, "r_x1": 532.63, "r_y1": 467.63, "r_x2": 532.63, "r_y2": 458.73, "r_x3": 62.6, "r_y3": 458.73, "coord_origin": "TOPLEFT" }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 501.25, "r_x1": 64.45, "r_y1": 501.25, "r_x2": 64.45, "r_y2": 491.4, "r_x3": 50.11, "r_y3": 491.4, "coord_origin": "TOPLEFT" }, "text": "5.5.", "orig": "5.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.01, "r_y0": 501.25, "r_x1": 163.76, "r_y1": 501.25, "r_x2": 163.76, "r_y2": 491.4, "r_x3": 74.01, "r_y3": 491.4, "coord_origin": "TOPLEFT" }, "text": "Qualitative Analysis", "orig": "Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 545.78, "r_x1": 286.36, "r_y1": 545.78, "r_x2": 286.36, "r_y2": 536.87, "r_x3": 62.07, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "We showcase several visualizations for the different", "orig": "We showcase several visualizations for the different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 557.73, "r_x1": 211.16, "r_y1": 557.73, "r_x2": 211.16, "r_y2": 548.83, "r_x3": 50.11, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.1, "r_y0": 557.51, "r_x1": 259.17, "r_y1": 557.51, "r_x2": 259.17, "r_y2": 548.92, "r_x3": 215.1, "r_y3": 548.92, "coord_origin": "TOPLEFT" }, "text": "\u201ccomplex\u201d", "orig": "\u201ccomplex\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.12, "r_y0": 557.73, "r_x1": 286.36, "r_y1": 557.73, "r_x2": 286.36, "r_y2": 548.83, "r_x3": 263.12, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 569.69, "r_x1": 286.37, "r_y1": 569.69, "r_x2": 286.37, "r_y2": 560.78, "r_x3": 50.11, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "within datasets presented in this work in Fig. 5 and Fig. 6", "orig": "within datasets presented in this work in Fig. 5 and Fig. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 581.64, "r_x1": 286.37, "r_y1": 581.64, "r_x2": 286.37, "r_y2": 572.74, "r_x3": 50.11, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 593.6, "r_x1": 286.37, "r_y1": 593.6, "r_x2": 286.37, "r_y2": 584.69, "r_x3": 50.11, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "for all table cells, even for the empty ones. Additionally,", "orig": "for all table cells, even for the empty ones. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 605.56, "r_x1": 286.37, "r_y1": 605.56, "r_x2": 286.37, "r_y2": 596.65, "r_x3": 50.11, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 617.51, "r_x1": 286.37, "r_y1": 617.51, "r_x2": 286.37, "r_y2": 608.6, "r_x3": 50.11, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 629.47, "r_x1": 286.37, "r_y1": 629.47, "r_x2": 286.37, "r_y2": 620.56, "r_x3": 50.11, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "based on their overlap and spatial proximity. The left part", "orig": "based on their overlap and spatial proximity. The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 641.42, "r_x1": 286.37, "r_y1": 641.42, "r_x2": 286.37, "r_y2": 632.51, "r_x3": 50.11, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "of Fig. 5 demonstrates also the adaptability of our method", "orig": "of Fig. 5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "to any language, as it can successfully extract Japanese", "orig": "to any language, as it can successfully extract Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 50.11, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "steps in the supplementary material. Overall these illustra-", "orig": "steps in the supplementary material. Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 226.89, "r_y1": 713.15, "r_x2": 226.89, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 501.46, "r_x1": 316.07, "r_y1": 501.46, "r_x2": 316.07, "r_y2": 490.71, "r_x3": 308.86, "r_y3": 490.71, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.69, "r_y0": 501.46, "r_x1": 460.85, "r_y1": 501.46, "r_x2": 460.85, "r_y2": 490.71, "r_x3": 325.69, "r_y3": 490.71, "coord_origin": "TOPLEFT" }, "text": "Future Work & Conclusion", "orig": "Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 521.8, "r_x1": 545.12, "r_y1": 521.8, "r_x2": 545.12, "r_y2": 512.89, "r_x3": 320.82, "r_y3": 512.89, "coord_origin": "TOPLEFT" }, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.75, "r_x1": 545.12, "r_y1": 533.75, "r_x2": 545.12, "r_y2": 524.85, "r_x3": 308.86, "r_y3": 524.85, "coord_origin": "TOPLEFT" }, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.71, "r_x1": 545.12, "r_y1": 545.71, "r_x2": 545.12, "r_y2": 536.8, "r_x3": 308.86, "r_y3": 536.8, "coord_origin": "TOPLEFT" }, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.66, "r_x1": 545.12, "r_y1": 557.66, "r_x2": 545.12, "r_y2": 548.76, "r_x3": 308.86, "r_y3": 548.76, "coord_origin": "TOPLEFT" }, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.62, "r_x1": 545.12, "r_y1": 569.62, "r_x2": 545.12, "r_y2": 560.71, "r_x3": 308.86, "r_y3": 560.71, "coord_origin": "TOPLEFT" }, "text": "content from PDF or OCR by using bounding boxes. Ad-", "orig": "content from PDF or OCR by using bounding boxes. Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.57, "r_x1": 545.12, "r_y1": 581.57, "r_x2": 545.12, "r_y2": 572.67, "r_x3": 308.86, "r_y3": 572.67, "coord_origin": "TOPLEFT" }, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.53, "r_x1": 545.12, "r_y1": 593.53, "r_x2": 545.12, "r_y2": 584.62, "r_x3": 308.86, "r_y3": 584.62, "coord_origin": "TOPLEFT" }, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.49, "r_x1": 400.47, "r_y1": 605.49, "r_x2": 400.47, "r_y2": 596.58, "r_x3": 308.86, "r_y3": 596.58, "coord_origin": "TOPLEFT" }, "text": "ments, and languages.", "orig": "ments, and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.38, "r_y0": 605.49, "r_x1": 545.12, "r_y1": 605.49, "r_x2": 545.12, "r_y2": 596.58, "r_x3": 408.38, "r_y3": 596.58, "coord_origin": "TOPLEFT" }, "text": "Furthermore, our method outper-", "orig": "Furthermore, our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.44, "r_x1": 545.12, "r_y1": 617.44, "r_x2": 545.12, "r_y2": 608.53, "r_x3": 308.86, "r_y3": 608.53, "coord_origin": "TOPLEFT" }, "text": "forms all state-of-the-arts with a wide margin. Finally, we", "orig": "forms all state-of-the-arts with a wide margin. Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.4, "r_x1": 545.12, "r_y1": 629.4, "r_x2": 545.12, "r_y2": 620.49, "r_x3": 308.86, "r_y3": 620.49, "coord_origin": "TOPLEFT" }, "text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.35, "r_x1": 545.12, "r_y1": 641.35, "r_x2": 545.12, "r_y2": 632.44, "r_x3": 308.86, "r_y3": 632.44, "coord_origin": "TOPLEFT" }, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.31, "r_x1": 365.86, "r_y1": 653.31, "r_x2": 365.86, "r_y2": 644.4, "r_x3": 308.86, "r_y3": 644.4, "coord_origin": "TOPLEFT" }, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 682.85, "r_x1": 364.41, "r_y1": 682.85, "r_x2": 364.41, "r_y2": 672.1, "r_x3": 308.86, "r_y3": 672.1, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 217, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.35, "r_y0": 701.98, "r_x1": 323.81, "r_y1": 701.98, "r_x2": 323.81, "r_y2": 693.96, "r_x3": 313.35, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 218, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.05, "r_y0": 701.98, "r_x1": 545.11, "r_y1": 701.98, "r_x2": 545.11, "r_y2": 693.96, "r_x3": 326.05, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 219, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 712.94, "r_x1": 545.11, "r_y1": 712.94, "r_x2": 545.11, "r_y2": 704.92, "r_x3": 328.78, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 220, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 18, "label": "caption", "bbox": { "l": 53.81, "t": 208.23, "r": 385.93, "b": 216.11, "coord_origin": "TOPLEFT" }, "confidence": 0.599, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.81, "r_y0": 216.11, "r_x1": 62.22, "r_y1": 216.11, "r_x2": 62.22, "r_y2": 208.23, "r_x3": 53.81, "r_y3": 208.23, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.42, "r_y0": 216.11, "r_x1": 385.93, "r_y1": 216.11, "r_x2": 385.93, "r_y2": 208.23, "r_x3": 66.42, "r_y3": 208.23, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "section_header", "bbox": { "l": 53.81, "t": 94.28, "r": 284.35, "b": 102.15, "coord_origin": "TOPLEFT" }, "confidence": 0.465, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.81, "r_y0": 102.15, "r_x1": 284.35, "r_y1": 102.15, "r_x2": 284.35, "r_y2": 94.28, "r_x3": 53.81, "r_y3": 94.28, "coord_origin": "TOPLEFT" }, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "section_header", "bbox": { "l": 304.83, "t": 94.28, "r": 431.09, "b": 102.15, "coord_origin": "TOPLEFT" }, "confidence": 0.463, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 304.83, "r_y0": 102.15, "r_x1": 431.09, "r_y1": 102.15, "r_x2": 431.09, "r_y2": 94.28, "r_x3": 304.83, "r_y3": 94.28, "coord_origin": "TOPLEFT" }, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "list_item", "bbox": { "l": 53.29, "t": 78.69, "r": 61.55, "b": 86.56, "coord_origin": "TOPLEFT" }, "confidence": 0.582, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.29, "r_y0": 86.56, "r_x1": 61.55, "r_y1": 86.56, "r_x2": 61.55, "r_y2": 78.69, "r_x3": 53.29, "r_y3": 78.69, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "list_item", "bbox": { "l": 65.68, "t": 78.69, "r": 499.56, "b": 86.56, "coord_origin": "TOPLEFT" }, "confidence": 0.541, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.68, "r_y0": 86.56, "r_x1": 499.56, "r_y1": 86.56, "r_x2": 499.56, "r_y2": 78.69, "r_x3": 65.68, "r_y3": 78.69, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 53.63, "t": 218.95, "r": 298.56, "b": 292.4, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 55, "label": "text", "bbox": { "l": 209.93, "t": 222.18, "r": 241.04, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 263.76, "t": 222.18, "r": 284.51, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 110.25, "t": 229.67, "r": 120.62, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 175.37, "t": 229.67, "r": 196.11, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 196.11, "t": 229.67, "r": 201.29, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 209.62, "t": 229.67, "r": 219.99, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 229.2, "t": 229.67, "r": 244.75, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 256.11, "t": 229.67, "r": 266.48, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 278.38, "t": 229.67, "r": 293.94, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 55.53, "t": 236.43, "r": 162.71, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 184.4, "t": 236.43, "r": 189.56, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 208.99, "t": 236.43, "r": 214.16, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 234.88, "t": 236.43, "r": 237.46, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 256.88, "t": 236.43, "r": 264.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 284.06, "t": 236.43, "r": 286.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 55.53, "t": 242.62, "r": 139.72, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 183.11, "t": 242.62, "r": 190.86, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 207.7, "t": 242.62, "r": 215.45, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 234.88, "t": 242.62, "r": 237.46, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 256.88, "t": 242.62, "r": 264.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 284.06, "t": 242.62, "r": 286.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 55.53, "t": 249.8, "r": 97.01, "b": 253.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 92.7, "t": 249.59, "r": 103.03, "b": 253.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 103.03, "t": 249.8, "r": 128.96, "b": 253.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 183.11, "t": 248.82, "r": 190.86, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 210.28, "t": 248.82, "r": 212.87, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.29, "t": 248.82, "r": 240.04, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 256.88, "t": 248.82, "r": 264.64, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 281.48, "t": 248.82, "r": 289.23, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 55.53, "t": 257.28, "r": 91.83, "b": 261.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 88.05, "t": 257.07, "r": 93.22, "b": 261.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 93.22, "t": 257.28, "r": 119.15, "b": 261.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 116.45, "t": 257.07, "r": 129.88, "b": 261.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.11, "t": 256.3, "r": 190.86, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 210.28, "t": 256.3, "r": 212.87, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 232.29, "t": 256.3, "r": 240.04, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 256.88, "t": 256.3, "r": 264.64, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 281.48, "t": 256.3, "r": 289.23, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 55.53, "t": 264.51, "r": 60.72, "b": 268.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 60.18, "t": 264.3, "r": 65.34, "b": 268.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 65.34, "t": 264.51, "r": 122.38, "b": 268.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 116.45, "t": 264.3, "r": 129.88, "b": 268.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 183.11, "t": 263.53, "r": 190.86, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 210.28, "t": 263.53, "r": 212.87, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 232.29, "t": 263.53, "r": 240.04, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 256.88, "t": 263.53, "r": 264.64, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 281.48, "t": 263.53, "r": 289.23, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 55.53, "t": 271.74, "r": 107.38, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 101.99, "t": 271.53, "r": 109.74, "b": 275.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 109.74, "t": 271.74, "r": 114.93, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 114.39, "t": 271.53, "r": 122.14, "b": 275.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 122.14, "t": 271.74, "r": 127.32, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 184.4, "t": 270.75, "r": 189.56, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 210.28, "t": 270.75, "r": 212.87, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 233.58, "t": 270.75, "r": 238.75, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 256.88, "t": 270.75, "r": 264.64, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 281.48, "t": 270.75, "r": 289.23, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 55.53, "t": 279.01, "r": 68.69, "b": 283.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 68.69, "t": 279.22, "r": 110.17, "b": 283.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 183.11, "t": 277.98, "r": 190.86, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 208.99, "t": 277.98, "r": 214.16, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 233.58, "t": 277.98, "r": 238.75, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 256.88, "t": 277.98, "r": 264.64, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 282.77, "t": 277.98, "r": 287.94, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 169.62, "t": 286.45, "r": 174.8, "b": 290.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 183.11, "t": 285.47, "r": 190.86, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 207.7, "t": 285.47, "r": 215.45, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 232.29, "t": 285.47, "r": 240.04, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 255.77, "t": 285.47, "r": 265.75, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 281.48, "t": 285.47, "r": 289.23, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 16, "label": "caption", "bbox": { "l": 380.43, "t": 292.3, "r": 549.42, "b": 298.6, "coord_origin": "TOPLEFT" }, "confidence": 0.75, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.43, "r_y0": 298.6, "r_x1": 549.42, "r_y1": 298.6, "r_x2": 549.42, "r_y2": 292.3, "r_x3": 380.43, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "table", "bbox": { "l": 304.92, "t": 218.51, "r": 550.23, "b": 287.9, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 125, "label": "text", "bbox": { "l": 459.05, "t": 221.62, "r": 542.0, "b": 226.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 493.82, "t": 227.83, "r": 507.23, "b": 232.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 393.24, "t": 236.75, "r": 400.75, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 400.75, "t": 236.75, "r": 404.65, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 404.65, "t": 236.75, "r": 407.35, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 392.1, "t": 221.57, "r": 438.01, "b": 226.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 427.18, "t": 236.75, "r": 440.99, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 468.38, "t": 236.75, "r": 482.48, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 516.93, "t": 236.75, "r": 530.73, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 306.11, "t": 244.61, "r": 355.65, "b": 249.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 355.65, "t": 244.61, "r": 364.66, "b": 249.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 396.25, "t": 244.91, "r": 400.75, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 400.75, "t": 244.91, "r": 403.76, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 429.82, "t": 244.91, "r": 437.33, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 465.53, "t": 244.91, "r": 478.4, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 480.98, "t": 244.91, "r": 483.55, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 513.45, "t": 244.91, "r": 531.47, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 306.11, "t": 253.68, "r": 325.63, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 396.25, "t": 253.68, "r": 400.75, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 400.75, "t": 253.68, "r": 403.76, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 429.82, "t": 253.68, "r": 437.33, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 466.44, "t": 253.68, "r": 482.55, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 514.29, "t": 253.68, "r": 530.81, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 306.11, "t": 261.55, "r": 322.63, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 394.43, "t": 261.55, "r": 400.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 400.73, "t": 261.55, "r": 403.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 403.74, "t": 261.55, "r": 405.54, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 427.7, "t": 261.55, "r": 438.81, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 468.56, "t": 261.55, "r": 482.07, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 516.02, "t": 261.55, "r": 529.53, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 155, "label": "text", "bbox": { "l": 306.11, "t": 269.64, "r": 356.25, "b": 274.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 394.43, "t": 270.32, "r": 400.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 157, "label": "text", "bbox": { "l": 400.73, "t": 270.32, "r": 403.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 158, "label": "text", "bbox": { "l": 403.74, "t": 270.32, "r": 405.54, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 159, "label": "text", "bbox": { "l": 431.03, "t": 270.32, "r": 436.43, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 160, "label": "text", "bbox": { "l": 465.83, "t": 270.32, "r": 482.35, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 161, "label": "text", "bbox": { "l": 516.02, "t": 270.32, "r": 529.53, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 162, "label": "text", "bbox": { "l": 306.11, "t": 278.49, "r": 373.36, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 163, "label": "text", "bbox": { "l": 396.25, "t": 278.49, "r": 403.76, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 164, "label": "text", "bbox": { "l": 429.52, "t": 278.49, "r": 437.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 165, "label": "text", "bbox": { "l": 463.71, "t": 278.49, "r": 484.74, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 166, "label": "text", "bbox": { "l": 512.99, "t": 278.49, "r": 534.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 6, "label": "caption", "bbox": { "l": 50.11, "t": 320.88, "r": 545.11, "b": 365.65, "coord_origin": "TOPLEFT" }, "confidence": 0.914, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 329.78, "r_x1": 86.86, "r_y1": 329.78, "r_x2": 86.86, "r_y2": 320.88, "r_x3": 50.11, "r_y3": 320.88, "coord_origin": "TOPLEFT" }, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.92, "r_y0": 329.78, "r_x1": 545.11, "r_y1": 329.78, "r_x2": 545.11, "r_y2": 320.88, "r_x3": 93.92, "r_y3": 320.88, "coord_origin": "TOPLEFT" }, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 341.74, "r_x1": 545.11, "r_y1": 341.74, "r_x2": 545.11, "r_y2": 332.83, "r_x3": 50.11, "r_y3": 332.83, "coord_origin": "TOPLEFT" }, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 353.69, "r_x1": 545.11, "r_y1": 353.69, "r_x2": 545.11, "r_y2": 344.79, "r_x3": 50.11, "r_y3": 344.79, "coord_origin": "TOPLEFT" }, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 365.65, "r_x1": 139.8, "r_y1": 365.65, "r_x2": 139.8, "r_y2": 356.74, "r_x3": 50.11, "r_y3": 356.74, "coord_origin": "TOPLEFT" }, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "picture", "bbox": { "l": 216.77, "t": 380.49, "r": 375.78, "b": 443.35, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26, "r_y0": 386.44, "r_x1": 342.08, "r_y1": 386.44, "r_x2": 342.08, "r_y2": 381.78, "r_x3": 220.26, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 167, "label": "text", "bbox": { "l": 220.26, "t": 381.78, "r": 342.08, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26, "r_y0": 386.44, "r_x1": 342.08, "r_y1": 386.44, "r_x2": 342.08, "r_y2": 381.78, "r_x3": 220.26, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 11, "label": "picture", "bbox": { "l": 51.74, "t": 380.48, "r": 211.84, "b": 443.66, "coord_origin": "TOPLEFT" }, "confidence": 0.831, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.72, "r_y0": 386.44, "r_x1": 85.66, "r_y1": 386.44, "r_x2": 85.66, "r_y2": 381.78, "r_x3": 53.72, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 168, "label": "text", "bbox": { "l": 53.72, "t": 381.78, "r": 85.66, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.72, "r_y0": 386.44, "r_x1": 85.66, "r_y1": 386.44, "r_x2": 85.66, "r_y2": 381.78, "r_x3": 53.72, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 13, "label": "picture", "bbox": { "l": 383.14, "t": 381.23, "r": 542.11, "b": 442.77, "coord_origin": "TOPLEFT" }, "confidence": 0.788, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 406.87, "r_x1": 443.7, "r_y1": 406.87, "r_x2": 443.7, "r_y2": 400.55, "r_x3": 437.38, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 406.87, "r_x1": 456.65, "r_y1": 406.87, "r_x2": 456.65, "r_y2": 400.55, "r_x3": 450.33, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 406.87, "r_x1": 469.6, "r_y1": 406.87, "r_x2": 469.6, "r_y2": 400.55, "r_x3": 463.28, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 406.87, "r_x1": 482.56, "r_y1": 406.87, "r_x2": 482.56, "r_y2": 400.55, "r_x3": 476.24, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 406.87, "r_x1": 495.51, "r_y1": 406.87, "r_x2": 495.51, "r_y2": 400.55, "r_x3": 489.19, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 406.87, "r_x1": 508.46, "r_y1": 406.87, "r_x2": 508.46, "r_y2": 400.55, "r_x3": 502.14, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 406.87, "r_x1": 521.41, "r_y1": 406.87, "r_x2": 521.41, "r_y2": 400.55, "r_x3": 515.1, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 417.36, "r_x1": 391.6, "r_y1": 417.36, "r_x2": 391.6, "r_y2": 411.04, "r_x3": 385.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 417.36, "r_x1": 404.84, "r_y1": 417.36, "r_x2": 404.84, "r_y2": 411.04, "r_x3": 398.52, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 417.36, "r_x1": 417.8, "r_y1": 417.36, "r_x2": 417.8, "r_y2": 411.04, "r_x3": 411.48, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 417.36, "r_x1": 443.7, "r_y1": 417.36, "r_x2": 443.7, "r_y2": 411.04, "r_x3": 437.38, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 417.36, "r_x1": 456.65, "r_y1": 417.36, "r_x2": 456.65, "r_y2": 411.04, "r_x3": 450.33, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 417.36, "r_x1": 469.6, "r_y1": 417.36, "r_x2": 469.6, "r_y2": 411.04, "r_x3": 463.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 427.39, "r_x1": 391.6, "r_y1": 427.39, "r_x2": 391.6, "r_y2": 421.07, "r_x3": 385.28, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 427.39, "r_x1": 404.84, "r_y1": 427.39, "r_x2": 404.84, "r_y2": 421.07, "r_x3": 398.52, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 427.39, "r_x1": 417.8, "r_y1": 427.39, "r_x2": 417.8, "r_y2": 421.07, "r_x3": 411.48, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 427.39, "r_x1": 430.75, "r_y1": 427.39, "r_x2": 430.75, "r_y2": 421.07, "r_x3": 424.43, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 427.39, "r_x1": 443.7, "r_y1": 427.39, "r_x2": 443.7, "r_y2": 421.07, "r_x3": 437.38, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 427.39, "r_x1": 456.65, "r_y1": 427.39, "r_x2": 456.65, "r_y2": 421.07, "r_x3": 450.33, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 427.39, "r_x1": 469.61, "r_y1": 427.39, "r_x2": 469.61, "r_y2": 421.07, "r_x3": 463.29, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 427.39, "r_x1": 482.56, "r_y1": 427.39, "r_x2": 482.56, "r_y2": 421.07, "r_x3": 476.24, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 427.39, "r_x1": 495.51, "r_y1": 427.39, "r_x2": 495.51, "r_y2": 421.07, "r_x3": 489.19, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 427.39, "r_x1": 508.46, "r_y1": 427.39, "r_x2": 508.46, "r_y2": 421.07, "r_x3": 502.14, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 427.39, "r_x1": 521.42, "r_y1": 427.39, "r_x2": 521.42, "r_y2": 421.07, "r_x3": 515.1, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 427.39, "r_x1": 534.37, "r_y1": 427.39, "r_x2": 534.37, "r_y2": 421.07, "r_x3": 528.05, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 438.36, "r_x1": 391.6, "r_y1": 438.36, "r_x2": 391.6, "r_y2": 432.04, "r_x3": 385.28, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 438.36, "r_x1": 404.84, "r_y1": 438.36, "r_x2": 404.84, "r_y2": 432.04, "r_x3": 398.52, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 438.36, "r_x1": 417.8, "r_y1": 438.36, "r_x2": 417.8, "r_y2": 432.04, "r_x3": 411.48, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 438.36, "r_x1": 430.75, "r_y1": 438.36, "r_x2": 430.75, "r_y2": 432.04, "r_x3": 424.43, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 438.36, "r_x1": 443.7, "r_y1": 438.36, "r_x2": 443.7, "r_y2": 432.04, "r_x3": 437.38, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 438.36, "r_x1": 456.65, "r_y1": 438.36, "r_x2": 456.65, "r_y2": 432.04, "r_x3": 450.33, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 438.36, "r_x1": 469.61, "r_y1": 438.36, "r_x2": 469.61, "r_y2": 432.04, "r_x3": 463.29, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 438.36, "r_x1": 482.56, "r_y1": 438.36, "r_x2": 482.56, "r_y2": 432.04, "r_x3": 476.24, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 438.36, "r_x1": 495.51, "r_y1": 438.36, "r_x2": 495.51, "r_y2": 432.04, "r_x3": 489.19, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 438.36, "r_x1": 508.46, "r_y1": 438.36, "r_x2": 508.46, "r_y2": 432.04, "r_x3": 502.14, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 438.36, "r_x1": 521.42, "r_y1": 438.36, "r_x2": 521.42, "r_y2": 432.04, "r_x3": 515.1, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 438.36, "r_x1": 534.37, "r_y1": 438.36, "r_x2": 534.37, "r_y2": 432.04, "r_x3": 528.05, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 395.52, "r_x1": 388.44, "r_y1": 395.52, "r_x2": 388.44, "r_y2": 389.2, "r_x3": 385.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 395.52, "r_x1": 401.68, "r_y1": 395.52, "r_x2": 401.68, "r_y2": 389.2, "r_x3": 398.52, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 395.52, "r_x1": 414.63, "r_y1": 395.52, "r_x2": 414.63, "r_y2": 389.2, "r_x3": 411.48, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 395.52, "r_x1": 427.59, "r_y1": 395.52, "r_x2": 427.59, "r_y2": 389.2, "r_x3": 424.43, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 395.52, "r_x1": 440.54, "r_y1": 395.52, "r_x2": 440.54, "r_y2": 389.2, "r_x3": 437.38, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 395.52, "r_x1": 453.49, "r_y1": 395.52, "r_x2": 453.49, "r_y2": 389.2, "r_x3": 450.33, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 395.52, "r_x1": 466.44, "r_y1": 395.52, "r_x2": 466.44, "r_y2": 389.2, "r_x3": 463.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 395.52, "r_x1": 479.39, "r_y1": 395.52, "r_x2": 479.39, "r_y2": 389.2, "r_x3": 476.24, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 395.52, "r_x1": 492.35, "r_y1": 395.52, "r_x2": 492.35, "r_y2": 389.2, "r_x3": 489.19, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 395.52, "r_x1": 505.3, "r_y1": 395.52, "r_x2": 505.3, "r_y2": 389.2, "r_x3": 502.14, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09, "r_y0": 395.52, "r_x1": 521.41, "r_y1": 395.52, "r_x2": 521.41, "r_y2": 389.2, "r_x3": 515.09, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04, "r_y0": 395.52, "r_x1": 534.13, "r_y1": 395.52, "r_x2": 534.13, "r_y2": 389.2, "r_x3": 528.04, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 405.29, "r_x1": 391.6, "r_y1": 405.29, "r_x2": 391.6, "r_y2": 398.97, "r_x3": 385.28, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 405.29, "r_x1": 404.84, "r_y1": 405.29, "r_x2": 404.84, "r_y2": 398.97, "r_x3": 398.52, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 405.29, "r_x1": 417.8, "r_y1": 405.29, "r_x2": 417.8, "r_y2": 398.97, "r_x3": 411.48, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 413.09, "r_x1": 430.75, "r_y1": 413.09, "r_x2": 430.75, "r_y2": 406.77, "r_x3": 424.43, "r_y3": 406.77, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.87, "r_y0": 417.31, "r_x1": 509.19, "r_y1": 417.31, "r_x2": 509.19, "r_y2": 410.99, "r_x3": 502.87, "r_y3": 410.99, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35, "r_y0": 386.44, "r_x1": 430.99, "r_y1": 386.44, "r_x2": 430.99, "r_y2": 381.78, "r_x3": 384.35, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 169, "label": "text", "bbox": { "l": 437.38, "t": 400.55, "r": 443.7, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 406.87, "r_x1": 443.7, "r_y1": 406.87, "r_x2": 443.7, "r_y2": 400.55, "r_x3": 437.38, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 170, "label": "text", "bbox": { "l": 450.33, "t": 400.55, "r": 456.65, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 406.87, "r_x1": 456.65, "r_y1": 406.87, "r_x2": 456.65, "r_y2": 400.55, "r_x3": 450.33, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 171, "label": "text", "bbox": { "l": 463.28, "t": 400.55, "r": 469.6, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 406.87, "r_x1": 469.6, "r_y1": 406.87, "r_x2": 469.6, "r_y2": 400.55, "r_x3": 463.28, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 172, "label": "text", "bbox": { "l": 476.24, "t": 400.55, "r": 482.56, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 406.87, "r_x1": 482.56, "r_y1": 406.87, "r_x2": 482.56, "r_y2": 400.55, "r_x3": 476.24, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 173, "label": "text", "bbox": { "l": 489.19, "t": 400.55, "r": 495.51, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 406.87, "r_x1": 495.51, "r_y1": 406.87, "r_x2": 495.51, "r_y2": 400.55, "r_x3": 489.19, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 174, "label": "text", "bbox": { "l": 502.14, "t": 400.55, "r": 508.46, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 406.87, "r_x1": 508.46, "r_y1": 406.87, "r_x2": 508.46, "r_y2": 400.55, "r_x3": 502.14, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 175, "label": "text", "bbox": { "l": 515.1, "t": 400.55, "r": 521.41, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 406.87, "r_x1": 521.41, "r_y1": 406.87, "r_x2": 521.41, "r_y2": 400.55, "r_x3": 515.1, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 176, "label": "text", "bbox": { "l": 385.28, "t": 411.04, "r": 391.6, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 417.36, "r_x1": 391.6, "r_y1": 417.36, "r_x2": 391.6, "r_y2": 411.04, "r_x3": 385.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 177, "label": "text", "bbox": { "l": 398.52, "t": 411.04, "r": 404.84, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 417.36, "r_x1": 404.84, "r_y1": 417.36, "r_x2": 404.84, "r_y2": 411.04, "r_x3": 398.52, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 178, "label": "text", "bbox": { "l": 411.48, "t": 411.04, "r": 417.8, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 417.36, "r_x1": 417.8, "r_y1": 417.36, "r_x2": 417.8, "r_y2": 411.04, "r_x3": 411.48, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 179, "label": "text", "bbox": { "l": 437.38, "t": 411.04, "r": 443.7, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 417.36, "r_x1": 443.7, "r_y1": 417.36, "r_x2": 443.7, "r_y2": 411.04, "r_x3": 437.38, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 180, "label": "text", "bbox": { "l": 450.33, "t": 411.04, "r": 456.65, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 417.36, "r_x1": 456.65, "r_y1": 417.36, "r_x2": 456.65, "r_y2": 411.04, "r_x3": 450.33, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 181, "label": "text", "bbox": { "l": 463.28, "t": 411.04, "r": 469.6, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 417.36, "r_x1": 469.6, "r_y1": 417.36, "r_x2": 469.6, "r_y2": 411.04, "r_x3": 463.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 182, "label": "text", "bbox": { "l": 385.28, "t": 421.07, "r": 391.6, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 427.39, "r_x1": 391.6, "r_y1": 427.39, "r_x2": 391.6, "r_y2": 421.07, "r_x3": 385.28, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 183, "label": "text", "bbox": { "l": 398.52, "t": 421.07, "r": 404.84, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 427.39, "r_x1": 404.84, "r_y1": 427.39, "r_x2": 404.84, "r_y2": 421.07, "r_x3": 398.52, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 184, "label": "text", "bbox": { "l": 411.48, "t": 421.07, "r": 417.8, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 427.39, "r_x1": 417.8, "r_y1": 427.39, "r_x2": 417.8, "r_y2": 421.07, "r_x3": 411.48, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 185, "label": "text", "bbox": { "l": 424.43, "t": 421.07, "r": 430.75, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 427.39, "r_x1": 430.75, "r_y1": 427.39, "r_x2": 430.75, "r_y2": 421.07, "r_x3": 424.43, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 186, "label": "text", "bbox": { "l": 437.38, "t": 421.07, "r": 443.7, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 427.39, "r_x1": 443.7, "r_y1": 427.39, "r_x2": 443.7, "r_y2": 421.07, "r_x3": 437.38, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 187, "label": "text", "bbox": { "l": 450.33, "t": 421.07, "r": 456.65, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 427.39, "r_x1": 456.65, "r_y1": 427.39, "r_x2": 456.65, "r_y2": 421.07, "r_x3": 450.33, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 188, "label": "text", "bbox": { "l": 463.29, "t": 421.07, "r": 469.61, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 427.39, "r_x1": 469.61, "r_y1": 427.39, "r_x2": 469.61, "r_y2": 421.07, "r_x3": 463.29, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 189, "label": "text", "bbox": { "l": 476.24, "t": 421.07, "r": 482.56, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 427.39, "r_x1": 482.56, "r_y1": 427.39, "r_x2": 482.56, "r_y2": 421.07, "r_x3": 476.24, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 190, "label": "text", "bbox": { "l": 489.19, "t": 421.07, "r": 495.51, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 427.39, "r_x1": 495.51, "r_y1": 427.39, "r_x2": 495.51, "r_y2": 421.07, "r_x3": 489.19, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 191, "label": "text", "bbox": { "l": 502.14, "t": 421.07, "r": 508.46, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 427.39, "r_x1": 508.46, "r_y1": 427.39, "r_x2": 508.46, "r_y2": 421.07, "r_x3": 502.14, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 192, "label": "text", "bbox": { "l": 515.1, "t": 421.07, "r": 521.42, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 427.39, "r_x1": 521.42, "r_y1": 427.39, "r_x2": 521.42, "r_y2": 421.07, "r_x3": 515.1, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 193, "label": "text", "bbox": { "l": 528.05, "t": 421.07, "r": 534.37, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 427.39, "r_x1": 534.37, "r_y1": 427.39, "r_x2": 534.37, "r_y2": 421.07, "r_x3": 528.05, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 194, "label": "text", "bbox": { "l": 385.28, "t": 432.04, "r": 391.6, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 438.36, "r_x1": 391.6, "r_y1": 438.36, "r_x2": 391.6, "r_y2": 432.04, "r_x3": 385.28, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 195, "label": "text", "bbox": { "l": 398.52, "t": 432.04, "r": 404.84, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 438.36, "r_x1": 404.84, "r_y1": 438.36, "r_x2": 404.84, "r_y2": 432.04, "r_x3": 398.52, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 196, "label": "text", "bbox": { "l": 411.48, "t": 432.04, "r": 417.8, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 438.36, "r_x1": 417.8, "r_y1": 438.36, "r_x2": 417.8, "r_y2": 432.04, "r_x3": 411.48, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 197, "label": "text", "bbox": { "l": 424.43, "t": 432.04, "r": 430.75, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 438.36, "r_x1": 430.75, "r_y1": 438.36, "r_x2": 430.75, "r_y2": 432.04, "r_x3": 424.43, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 198, "label": "text", "bbox": { "l": 437.38, "t": 432.04, "r": 443.7, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 438.36, "r_x1": 443.7, "r_y1": 438.36, "r_x2": 443.7, "r_y2": 432.04, "r_x3": 437.38, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 199, "label": "text", "bbox": { "l": 450.33, "t": 432.04, "r": 456.65, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 438.36, "r_x1": 456.65, "r_y1": 438.36, "r_x2": 456.65, "r_y2": 432.04, "r_x3": 450.33, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 200, "label": "text", "bbox": { "l": 463.29, "t": 432.04, "r": 469.61, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 438.36, "r_x1": 469.61, "r_y1": 438.36, "r_x2": 469.61, "r_y2": 432.04, "r_x3": 463.29, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 201, "label": "text", "bbox": { "l": 476.24, "t": 432.04, "r": 482.56, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 438.36, "r_x1": 482.56, "r_y1": 438.36, "r_x2": 482.56, "r_y2": 432.04, "r_x3": 476.24, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 202, "label": "text", "bbox": { "l": 489.19, "t": 432.04, "r": 495.51, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 438.36, "r_x1": 495.51, "r_y1": 438.36, "r_x2": 495.51, "r_y2": 432.04, "r_x3": 489.19, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 203, "label": "text", "bbox": { "l": 502.14, "t": 432.04, "r": 508.46, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 438.36, "r_x1": 508.46, "r_y1": 438.36, "r_x2": 508.46, "r_y2": 432.04, "r_x3": 502.14, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 204, "label": "text", "bbox": { "l": 515.1, "t": 432.04, "r": 521.42, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 438.36, "r_x1": 521.42, "r_y1": 438.36, "r_x2": 521.42, "r_y2": 432.04, "r_x3": 515.1, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 205, "label": "text", "bbox": { "l": 528.05, "t": 432.04, "r": 534.37, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 438.36, "r_x1": 534.37, "r_y1": 438.36, "r_x2": 534.37, "r_y2": 432.04, "r_x3": 528.05, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 206, "label": "text", "bbox": { "l": 385.28, "t": 389.2, "r": 388.44, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 395.52, "r_x1": 388.44, "r_y1": 395.52, "r_x2": 388.44, "r_y2": 389.2, "r_x3": 385.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 207, "label": "text", "bbox": { "l": 398.52, "t": 389.2, "r": 401.68, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 395.52, "r_x1": 401.68, "r_y1": 395.52, "r_x2": 401.68, "r_y2": 389.2, "r_x3": 398.52, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 208, "label": "text", "bbox": { "l": 411.48, "t": 389.2, "r": 414.63, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 395.52, "r_x1": 414.63, "r_y1": 395.52, "r_x2": 414.63, "r_y2": 389.2, "r_x3": 411.48, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 209, "label": "text", "bbox": { "l": 424.43, "t": 389.2, "r": 427.59, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 395.52, "r_x1": 427.59, "r_y1": 395.52, "r_x2": 427.59, "r_y2": 389.2, "r_x3": 424.43, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 210, "label": "text", "bbox": { "l": 437.38, "t": 389.2, "r": 440.54, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 395.52, "r_x1": 440.54, "r_y1": 395.52, "r_x2": 440.54, "r_y2": 389.2, "r_x3": 437.38, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 211, "label": "text", "bbox": { "l": 450.33, "t": 389.2, "r": 453.49, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 395.52, "r_x1": 453.49, "r_y1": 395.52, "r_x2": 453.49, "r_y2": 389.2, "r_x3": 450.33, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 212, "label": "text", "bbox": { "l": 463.28, "t": 389.2, "r": 466.44, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 395.52, "r_x1": 466.44, "r_y1": 395.52, "r_x2": 466.44, "r_y2": 389.2, "r_x3": 463.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 213, "label": "text", "bbox": { "l": 476.24, "t": 389.2, "r": 479.39, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 395.52, "r_x1": 479.39, "r_y1": 395.52, "r_x2": 479.39, "r_y2": 389.2, "r_x3": 476.24, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 214, "label": "text", "bbox": { "l": 489.19, "t": 389.2, "r": 492.35, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 395.52, "r_x1": 492.35, "r_y1": 395.52, "r_x2": 492.35, "r_y2": 389.2, "r_x3": 489.19, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 215, "label": "text", "bbox": { "l": 502.14, "t": 389.2, "r": 505.3, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 395.52, "r_x1": 505.3, "r_y1": 395.52, "r_x2": 505.3, "r_y2": 389.2, "r_x3": 502.14, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 216, "label": "text", "bbox": { "l": 515.09, "t": 389.2, "r": 521.41, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09, "r_y0": 395.52, "r_x1": 521.41, "r_y1": 395.52, "r_x2": 521.41, "r_y2": 389.2, "r_x3": 515.09, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 217, "label": "text", "bbox": { "l": 528.04, "t": 389.2, "r": 534.13, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04, "r_y0": 395.52, "r_x1": 534.13, "r_y1": 395.52, "r_x2": 534.13, "r_y2": 389.2, "r_x3": 528.04, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 218, "label": "text", "bbox": { "l": 385.28, "t": 398.97, "r": 391.6, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 405.29, "r_x1": 391.6, "r_y1": 405.29, "r_x2": 391.6, "r_y2": 398.97, "r_x3": 385.28, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 219, "label": "text", "bbox": { "l": 398.52, "t": 398.97, "r": 404.84, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 405.29, "r_x1": 404.84, "r_y1": 405.29, "r_x2": 404.84, "r_y2": 398.97, "r_x3": 398.52, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 220, "label": "text", "bbox": { "l": 411.48, "t": 398.97, "r": 417.8, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 405.29, "r_x1": 417.8, "r_y1": 405.29, "r_x2": 417.8, "r_y2": 398.97, "r_x3": 411.48, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 221, "label": "text", "bbox": { "l": 424.43, "t": 406.77, "r": 430.75, "b": 413.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 413.09, "r_x1": 430.75, "r_y1": 413.09, "r_x2": 430.75, "r_y2": 406.77, "r_x3": 424.43, "r_y3": 406.77, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 222, "label": "text", "bbox": { "l": 502.87, "t": 410.99, "r": 509.19, "b": 417.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.87, "r_y0": 417.31, "r_x1": 509.19, "r_y1": 417.31, "r_x2": 509.19, "r_y2": 410.99, "r_x3": 502.87, "r_y3": 410.99, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 223, "label": "text", "bbox": { "l": 384.35, "t": 381.78, "r": 430.99, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35, "r_y0": 386.44, "r_x1": 430.99, "r_y1": 386.44, "r_x2": 430.99, "r_y2": 381.78, "r_x3": 384.35, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 5, "label": "caption", "bbox": { "l": 62.6, "t": 458.73, "r": 532.63, "b": 467.63, "coord_origin": "TOPLEFT" }, "confidence": 0.915, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.6, "r_y0": 467.63, "r_x1": 532.63, "r_y1": 467.63, "r_x2": 532.63, "r_y2": 458.73, "r_x3": 62.6, "r_y3": 458.73, "coord_origin": "TOPLEFT" }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "section_header", "bbox": { "l": 50.11, "t": 491.4, "r": 163.76, "b": 501.25, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 501.25, "r_x1": 64.45, "r_y1": 501.25, "r_x2": 64.45, "r_y2": 491.4, "r_x3": 50.11, "r_y3": 491.4, "coord_origin": "TOPLEFT" }, "text": "5.5.", "orig": "5.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.01, "r_y0": 501.25, "r_x1": 163.76, "r_y1": 501.25, "r_x2": 163.76, "r_y2": 491.4, "r_x3": 74.01, "r_y3": 491.4, "coord_origin": "TOPLEFT" }, "text": "Qualitative Analysis", "orig": "Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 536.87, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 545.78, "r_x1": 286.36, "r_y1": 545.78, "r_x2": 286.36, "r_y2": 536.87, "r_x3": 62.07, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "We showcase several visualizations for the different", "orig": "We showcase several visualizations for the different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 557.73, "r_x1": 211.16, "r_y1": 557.73, "r_x2": 211.16, "r_y2": 548.83, "r_x3": 50.11, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.1, "r_y0": 557.51, "r_x1": 259.17, "r_y1": 557.51, "r_x2": 259.17, "r_y2": 548.92, "r_x3": 215.1, "r_y3": 548.92, "coord_origin": "TOPLEFT" }, "text": "\u201ccomplex\u201d", "orig": "\u201ccomplex\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.12, "r_y0": 557.73, "r_x1": 286.36, "r_y1": 557.73, "r_x2": 286.36, "r_y2": 548.83, "r_x3": 263.12, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 569.69, "r_x1": 286.37, "r_y1": 569.69, "r_x2": 286.37, "r_y2": 560.78, "r_x3": 50.11, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "within datasets presented in this work in Fig. 5 and Fig. 6", "orig": "within datasets presented in this work in Fig. 5 and Fig. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 581.64, "r_x1": 286.37, "r_y1": 581.64, "r_x2": 286.37, "r_y2": 572.74, "r_x3": 50.11, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 593.6, "r_x1": 286.37, "r_y1": 593.6, "r_x2": 286.37, "r_y2": 584.69, "r_x3": 50.11, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "for all table cells, even for the empty ones. Additionally,", "orig": "for all table cells, even for the empty ones. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 605.56, "r_x1": 286.37, "r_y1": 605.56, "r_x2": 286.37, "r_y2": 596.65, "r_x3": 50.11, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 617.51, "r_x1": 286.37, "r_y1": 617.51, "r_x2": 286.37, "r_y2": 608.6, "r_x3": 50.11, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 629.47, "r_x1": 286.37, "r_y1": 629.47, "r_x2": 286.37, "r_y2": 620.56, "r_x3": 50.11, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "based on their overlap and spatial proximity. The left part", "orig": "based on their overlap and spatial proximity. The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 641.42, "r_x1": 286.37, "r_y1": 641.42, "r_x2": 286.37, "r_y2": 632.51, "r_x3": 50.11, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "of Fig. 5 demonstrates also the adaptability of our method", "orig": "of Fig. 5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "to any language, as it can successfully extract Japanese", "orig": "to any language, as it can successfully extract Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 50.11, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "steps in the supplementary material. Overall these illustra-", "orig": "steps in the supplementary material. Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 226.89, "r_y1": 713.15, "r_x2": 226.89, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 308.86, "t": 490.71, "r": 460.85, "b": 501.46, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 501.46, "r_x1": 316.07, "r_y1": 501.46, "r_x2": 316.07, "r_y2": 490.71, "r_x3": 308.86, "r_y3": 490.71, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.69, "r_y0": 501.46, "r_x1": 460.85, "r_y1": 501.46, "r_x2": 460.85, "r_y2": 490.71, "r_x3": 325.69, "r_y3": 490.71, "coord_origin": "TOPLEFT" }, "text": "Future Work & Conclusion", "orig": "Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 512.89, "r": 545.12, "b": 653.31, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 521.8, "r_x1": 545.12, "r_y1": 521.8, "r_x2": 545.12, "r_y2": 512.89, "r_x3": 320.82, "r_y3": 512.89, "coord_origin": "TOPLEFT" }, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.75, "r_x1": 545.12, "r_y1": 533.75, "r_x2": 545.12, "r_y2": 524.85, "r_x3": 308.86, "r_y3": 524.85, "coord_origin": "TOPLEFT" }, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.71, "r_x1": 545.12, "r_y1": 545.71, "r_x2": 545.12, "r_y2": 536.8, "r_x3": 308.86, "r_y3": 536.8, "coord_origin": "TOPLEFT" }, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.66, "r_x1": 545.12, "r_y1": 557.66, "r_x2": 545.12, "r_y2": 548.76, "r_x3": 308.86, "r_y3": 548.76, "coord_origin": "TOPLEFT" }, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.62, "r_x1": 545.12, "r_y1": 569.62, "r_x2": 545.12, "r_y2": 560.71, "r_x3": 308.86, "r_y3": 560.71, "coord_origin": "TOPLEFT" }, "text": "content from PDF or OCR by using bounding boxes. Ad-", "orig": "content from PDF or OCR by using bounding boxes. Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.57, "r_x1": 545.12, "r_y1": 581.57, "r_x2": 545.12, "r_y2": 572.67, "r_x3": 308.86, "r_y3": 572.67, "coord_origin": "TOPLEFT" }, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.53, "r_x1": 545.12, "r_y1": 593.53, "r_x2": 545.12, "r_y2": 584.62, "r_x3": 308.86, "r_y3": 584.62, "coord_origin": "TOPLEFT" }, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.49, "r_x1": 400.47, "r_y1": 605.49, "r_x2": 400.47, "r_y2": 596.58, "r_x3": 308.86, "r_y3": 596.58, "coord_origin": "TOPLEFT" }, "text": "ments, and languages.", "orig": "ments, and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.38, "r_y0": 605.49, "r_x1": 545.12, "r_y1": 605.49, "r_x2": 545.12, "r_y2": 596.58, "r_x3": 408.38, "r_y3": 596.58, "coord_origin": "TOPLEFT" }, "text": "Furthermore, our method outper-", "orig": "Furthermore, our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.44, "r_x1": 545.12, "r_y1": 617.44, "r_x2": 545.12, "r_y2": 608.53, "r_x3": 308.86, "r_y3": 608.53, "coord_origin": "TOPLEFT" }, "text": "forms all state-of-the-arts with a wide margin. Finally, we", "orig": "forms all state-of-the-arts with a wide margin. Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.4, "r_x1": 545.12, "r_y1": 629.4, "r_x2": 545.12, "r_y2": 620.49, "r_x3": 308.86, "r_y3": 620.49, "coord_origin": "TOPLEFT" }, "text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.35, "r_x1": 545.12, "r_y1": 641.35, "r_x2": 545.12, "r_y2": 632.44, "r_x3": 308.86, "r_y3": 632.44, "coord_origin": "TOPLEFT" }, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.31, "r_x1": 365.86, "r_y1": 653.31, "r_x2": 365.86, "r_y2": 644.4, "r_x3": 308.86, "r_y3": 644.4, "coord_origin": "TOPLEFT" }, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 308.86, "t": 672.1, "r": 364.41, "b": 682.85, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 682.85, "r_x1": 364.41, "r_y1": 682.85, "r_x2": 364.41, "r_y2": 672.1, "r_x3": 308.86, "r_y3": 672.1, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 313.35, "t": 693.96, "r": 545.11, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.832, "cells": [ { "index": 217, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.35, "r_y0": 701.98, "r_x1": 323.81, "r_y1": 701.98, "r_x2": 323.81, "r_y2": 693.96, "r_x3": 313.35, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 218, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.05, "r_y0": 701.98, "r_x1": 545.11, "r_y1": 701.98, "r_x2": 545.11, "r_y2": 693.96, "r_x3": 326.05, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 219, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 712.94, "r_x1": 545.11, "r_y1": 712.94, "r_x2": 545.11, "r_y2": 704.92, "r_x3": 328.78, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.871, "cells": [ { "index": 220, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "picture", "bbox": { "l": 305.58, "t": 98.65, "r": 554.83, "b": 180.63, "coord_origin": "TOPLEFT" }, "confidence": 0.77, "cells": [], "children": [] }, { "id": 14, "label": "picture", "bbox": { "l": 49.98, "t": 103.71, "r": 301.63, "b": 187.58, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": { "8": { "label": "table", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "table", "bbox": { "l": 53.63, "t": 218.95, "r": 298.56, "b": 292.4, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 55, "label": "text", "bbox": { "l": 209.93, "t": 222.18, "r": 241.04, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 263.76, "t": 222.18, "r": 284.51, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 110.25, "t": 229.67, "r": 120.62, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 175.37, "t": 229.67, "r": 196.11, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 196.11, "t": 229.67, "r": 201.29, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 209.62, "t": 229.67, "r": 219.99, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 229.2, "t": 229.67, "r": 244.75, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 256.11, "t": 229.67, "r": 266.48, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 278.38, "t": 229.67, "r": 293.94, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 55.53, "t": 236.43, "r": 162.71, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 184.4, "t": 236.43, "r": 189.56, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 208.99, "t": 236.43, "r": 214.16, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 234.88, "t": 236.43, "r": 237.46, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 256.88, "t": 236.43, "r": 264.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 284.06, "t": 236.43, "r": 286.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 55.53, "t": 242.62, "r": 139.72, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 183.11, "t": 242.62, "r": 190.86, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 207.7, "t": 242.62, "r": 215.45, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 234.88, "t": 242.62, "r": 237.46, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 256.88, "t": 242.62, "r": 264.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 284.06, "t": 242.62, "r": 286.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 55.53, "t": 249.8, "r": 97.01, "b": 253.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 92.7, "t": 249.59, "r": 103.03, "b": 253.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 103.03, "t": 249.8, "r": 128.96, "b": 253.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 183.11, "t": 248.82, "r": 190.86, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 210.28, "t": 248.82, "r": 212.87, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.29, "t": 248.82, "r": 240.04, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 256.88, "t": 248.82, "r": 264.64, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 281.48, "t": 248.82, "r": 289.23, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 55.53, "t": 257.28, "r": 91.83, "b": 261.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 88.05, "t": 257.07, "r": 93.22, "b": 261.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 93.22, "t": 257.28, "r": 119.15, "b": 261.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 116.45, "t": 257.07, "r": 129.88, "b": 261.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.11, "t": 256.3, "r": 190.86, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 210.28, "t": 256.3, "r": 212.87, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 232.29, "t": 256.3, "r": 240.04, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 256.88, "t": 256.3, "r": 264.64, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 281.48, "t": 256.3, "r": 289.23, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 55.53, "t": 264.51, "r": 60.72, "b": 268.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 60.18, "t": 264.3, "r": 65.34, "b": 268.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 65.34, "t": 264.51, "r": 122.38, "b": 268.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 116.45, "t": 264.3, "r": 129.88, "b": 268.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 183.11, "t": 263.53, "r": 190.86, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 210.28, "t": 263.53, "r": 212.87, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 232.29, "t": 263.53, "r": 240.04, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 256.88, "t": 263.53, "r": 264.64, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 281.48, "t": 263.53, "r": 289.23, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 55.53, "t": 271.74, "r": 107.38, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 101.99, "t": 271.53, "r": 109.74, "b": 275.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 109.74, "t": 271.74, "r": 114.93, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 114.39, "t": 271.53, "r": 122.14, "b": 275.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 122.14, "t": 271.74, "r": 127.32, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 184.4, "t": 270.75, "r": 189.56, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 210.28, "t": 270.75, "r": 212.87, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 233.58, "t": 270.75, "r": 238.75, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 256.88, "t": 270.75, "r": 264.64, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 281.48, "t": 270.75, "r": 289.23, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 55.53, "t": 279.01, "r": 68.69, "b": 283.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 68.69, "t": 279.22, "r": 110.17, "b": 283.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 183.11, "t": 277.98, "r": 190.86, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 208.99, "t": 277.98, "r": 214.16, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 233.58, "t": 277.98, "r": 238.75, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 256.88, "t": 277.98, "r": 264.64, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 282.77, "t": 277.98, "r": 287.94, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 169.62, "t": 286.45, "r": 174.8, "b": 290.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 183.11, "t": 285.47, "r": 190.86, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 207.7, "t": 285.47, "r": 215.45, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 232.29, "t": 285.47, "r": 240.04, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 255.77, "t": 285.47, "r": 265.75, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 281.48, "t": 285.47, "r": 289.23, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 10, "num_cols": 6, "table_cells": [ { "bbox": { "l": 209.93, "t": 222.18, "r": 241.04, "b": 226.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 263.76, "t": 222.18, "r": 284.51, "b": 226.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 110.25, "t": 229.67, "r": 120.62, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 175.37, "t": 229.67, "r": 196.11, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb \u6570", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 209.62, "t": 229.67, "r": 219.99, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 229.2, "t": 229.67, "r": 244.75, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 256.11, "t": 229.67, "r": 266.48, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 278.38, "t": 229.67, "r": 293.94, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 236.43, "r": 162.71, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.4, "t": 236.43, "r": 189.56, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99, "t": 236.43, "r": 214.16, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.88, "t": 236.43, "r": 237.46, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 236.43, "r": 264.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06, "t": 236.43, "r": 286.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 242.62, "r": 139.72, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 242.62, "r": 190.86, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.7, "t": 242.62, "r": 215.45, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.88, "t": 242.62, "r": 237.46, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 242.62, "r": 264.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06, "t": 242.62, "r": 286.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 249.8, "r": 97.01, "b": 253.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 248.82, "r": 190.86, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 248.82, "r": 212.87, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 248.82, "r": 240.04, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 248.82, "r": 264.64, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 248.82, "r": 289.23, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 257.28, "r": 91.83, "b": 261.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 256.3, "r": 190.86, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 256.3, "r": 212.87, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 256.3, "r": 240.04, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 256.3, "r": 264.64, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 256.3, "r": 289.23, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 264.51, "r": 60.72, "b": 268.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 263.53, "r": 190.86, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 263.53, "r": 212.87, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 263.53, "r": 240.04, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 263.53, "r": 264.64, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 263.53, "r": 289.23, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 271.74, "r": 107.38, "b": 275.92, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.4, "t": 270.75, "r": 189.56, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 270.75, "r": 212.87, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58, "t": 270.75, "r": 238.75, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 270.75, "r": 264.64, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 270.75, "r": 289.23, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 279.01, "r": 68.69, "b": 283.37, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 277.98, "r": 190.86, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99, "t": 277.98, "r": 214.16, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58, "t": 277.98, "r": 238.75, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 277.98, "r": 264.64, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 282.77, "t": 277.98, "r": 287.94, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 169.62, "t": 286.45, "r": 174.8, "b": 290.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 285.47, "r": 190.86, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.7, "t": 285.47, "r": 215.45, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 285.47, "r": 240.04, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 255.77, "t": 285.47, "r": 265.75, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 285.47, "r": 289.23, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false } ] }, "7": { "label": "table", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "table", "bbox": { "l": 304.92, "t": 218.51, "r": 550.23, "b": 287.9, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 125, "label": "text", "bbox": { "l": 459.05, "t": 221.62, "r": 542.0, "b": 226.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 493.82, "t": 227.83, "r": 507.23, "b": 232.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 393.24, "t": 236.75, "r": 400.75, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 400.75, "t": 236.75, "r": 404.65, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 404.65, "t": 236.75, "r": 407.35, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 392.1, "t": 221.57, "r": 438.01, "b": 226.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 427.18, "t": 236.75, "r": 440.99, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 468.38, "t": 236.75, "r": 482.48, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 516.93, "t": 236.75, "r": 530.73, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 306.11, "t": 244.61, "r": 355.65, "b": 249.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 355.65, "t": 244.61, "r": 364.66, "b": 249.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 396.25, "t": 244.91, "r": 400.75, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 400.75, "t": 244.91, "r": 403.76, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 429.82, "t": 244.91, "r": 437.33, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 465.53, "t": 244.91, "r": 478.4, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 480.98, "t": 244.91, "r": 483.55, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 513.45, "t": 244.91, "r": 531.47, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 306.11, "t": 253.68, "r": 325.63, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 396.25, "t": 253.68, "r": 400.75, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 400.75, "t": 253.68, "r": 403.76, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 429.82, "t": 253.68, "r": 437.33, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 466.44, "t": 253.68, "r": 482.55, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 514.29, "t": 253.68, "r": 530.81, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 306.11, "t": 261.55, "r": 322.63, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 394.43, "t": 261.55, "r": 400.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 400.73, "t": 261.55, "r": 403.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 403.74, "t": 261.55, "r": 405.54, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 427.7, "t": 261.55, "r": 438.81, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 468.56, "t": 261.55, "r": 482.07, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 516.02, "t": 261.55, "r": 529.53, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 155, "label": "text", "bbox": { "l": 306.11, "t": 269.64, "r": 356.25, "b": 274.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 394.43, "t": 270.32, "r": 400.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 157, "label": "text", "bbox": { "l": 400.73, "t": 270.32, "r": 403.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 158, "label": "text", "bbox": { "l": 403.74, "t": 270.32, "r": 405.54, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 159, "label": "text", "bbox": { "l": 431.03, "t": 270.32, "r": 436.43, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 160, "label": "text", "bbox": { "l": 465.83, "t": 270.32, "r": 482.35, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 161, "label": "text", "bbox": { "l": 516.02, "t": 270.32, "r": 529.53, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 162, "label": "text", "bbox": { "l": 306.11, "t": 278.49, "r": 373.36, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 163, "label": "text", "bbox": { "l": 396.25, "t": 278.49, "r": 403.76, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 164, "label": "text", "bbox": { "l": 429.52, "t": 278.49, "r": 437.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 165, "label": "text", "bbox": { "l": 463.71, "t": 278.49, "r": 484.74, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 166, "label": "text", "bbox": { "l": 512.99, "t": 278.49, "r": 534.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 459.05, "t": 221.62, "r": 542.0, "b": 226.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 393.24, "t": 236.75, "r": 400.75, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RS U s", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 392.1, "t": 221.57, "r": 438.01, "b": 226.64, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.18, "t": 236.75, "r": 440.99, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 468.38, "t": 236.75, "r": 482.48, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 516.93, "t": 236.75, "r": 530.73, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 244.61, "r": 355.65, "b": 249.68, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on Janua ry 1", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 244.91, "r": 400.75, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1. 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.82, "t": 244.91, "r": 437.33, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.53, "t": 244.91, "r": 478.4, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.45, "t": 244.91, "r": 531.47, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 253.68, "r": 325.63, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 253.68, "r": 400.75, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0. 5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.82, "t": 253.68, "r": 437.33, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 466.44, "t": 253.68, "r": 482.55, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 514.29, "t": 253.68, "r": 530.81, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 261.55, "r": 322.63, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43, "t": 261.55, "r": 400.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 5 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 427.7, "t": 261.55, "r": 438.81, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 468.56, "t": 261.55, "r": 482.07, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.02, "t": 261.55, "r": 529.53, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 269.64, "r": 356.25, "b": 274.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43, "t": 270.32, "r": 400.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 1 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 431.03, "t": 270.32, "r": 436.43, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.83, "t": 270.32, "r": 482.35, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.02, "t": 270.32, "r": 529.53, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 278.49, "r": 373.36, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 278.49, "r": 403.76, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.52, "t": 278.49, "r": 437.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 463.71, "t": 278.49, "r": 484.74, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.99, "t": 278.49, "r": 534.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "caption", "id": 18, "page_no": 7, "cluster": { "id": 18, "label": "caption", "bbox": { "l": 53.81, "t": 208.23, "r": 385.93, "b": 216.11, "coord_origin": "TOPLEFT" }, "confidence": 0.599, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.81, "r_y0": 216.11, "r_x1": 62.22, "r_y1": 216.11, "r_x2": 62.22, "r_y2": 208.23, "r_x3": 53.81, "r_y3": 208.23, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.42, "r_y0": 216.11, "r_x1": 385.93, "r_y1": 216.11, "r_x2": 385.93, "r_y2": 208.23, "r_x3": 66.42, "r_y3": 208.23, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:" }, { "label": "section_header", "id": 29, "page_no": 7, "cluster": { "id": 29, "label": "section_header", "bbox": { "l": 53.81, "t": 94.28, "r": 284.35, "b": 102.15, "coord_origin": "TOPLEFT" }, "confidence": 0.465, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.81, "r_y0": 102.15, "r_x1": 284.35, "r_y1": 102.15, "r_x2": 284.35, "r_y2": 94.28, "r_x3": 53.81, "r_y3": 94.28, "coord_origin": "TOPLEFT" }, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Japanese language (previously unseen by TableFormer):" }, { "label": "section_header", "id": 31, "page_no": 7, "cluster": { "id": 31, "label": "section_header", "bbox": { "l": 304.83, "t": 94.28, "r": 431.09, "b": 102.15, "coord_origin": "TOPLEFT" }, "confidence": 0.463, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 304.83, "r_y0": 102.15, "r_x1": 431.09, "r_y1": 102.15, "r_x2": 431.09, "r_y2": 94.28, "r_x3": 304.83, "r_y3": 94.28, "coord_origin": "TOPLEFT" }, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Example table from FinTabNet:" }, { "label": "list_item", "id": 20, "page_no": 7, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 53.29, "t": 78.69, "r": 61.55, "b": 86.56, "coord_origin": "TOPLEFT" }, "confidence": 0.582, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.29, "r_y0": 86.56, "r_x1": 61.55, "r_y1": 86.56, "r_x2": 61.55, "r_y2": 78.69, "r_x3": 53.29, "r_y3": 78.69, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "a." }, { "label": "list_item", "id": 21, "page_no": 7, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 65.68, "t": 78.69, "r": 499.56, "b": 86.56, "coord_origin": "TOPLEFT" }, "confidence": 0.541, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.68, "r_y0": 86.56, "r_x1": 499.56, "r_y1": 86.56, "r_x2": 499.56, "r_y2": 78.69, "r_x3": 65.68, "r_y3": 78.69, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells" }, { "label": "table", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "table", "bbox": { "l": 53.63, "t": 218.95, "r": 298.56, "b": 292.4, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 55, "label": "text", "bbox": { "l": 209.93, "t": 222.18, "r": 241.04, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 263.76, "t": 222.18, "r": 284.51, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 110.25, "t": 229.67, "r": 120.62, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 175.37, "t": 229.67, "r": 196.11, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 196.11, "t": 229.67, "r": 201.29, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 209.62, "t": 229.67, "r": 219.99, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 229.2, "t": 229.67, "r": 244.75, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 256.11, "t": 229.67, "r": 266.48, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 278.38, "t": 229.67, "r": 293.94, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 55.53, "t": 236.43, "r": 162.71, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 184.4, "t": 236.43, "r": 189.56, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 208.99, "t": 236.43, "r": 214.16, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 234.88, "t": 236.43, "r": 237.46, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 256.88, "t": 236.43, "r": 264.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 284.06, "t": 236.43, "r": 286.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 55.53, "t": 242.62, "r": 139.72, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 183.11, "t": 242.62, "r": 190.86, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 207.7, "t": 242.62, "r": 215.45, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 234.88, "t": 242.62, "r": 237.46, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 256.88, "t": 242.62, "r": 264.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 284.06, "t": 242.62, "r": 286.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 55.53, "t": 249.8, "r": 97.01, "b": 253.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 92.7, "t": 249.59, "r": 103.03, "b": 253.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 103.03, "t": 249.8, "r": 128.96, "b": 253.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 183.11, "t": 248.82, "r": 190.86, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 210.28, "t": 248.82, "r": 212.87, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.29, "t": 248.82, "r": 240.04, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 256.88, "t": 248.82, "r": 264.64, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 281.48, "t": 248.82, "r": 289.23, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 55.53, "t": 257.28, "r": 91.83, "b": 261.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 88.05, "t": 257.07, "r": 93.22, "b": 261.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 93.22, "t": 257.28, "r": 119.15, "b": 261.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 116.45, "t": 257.07, "r": 129.88, "b": 261.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.11, "t": 256.3, "r": 190.86, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 210.28, "t": 256.3, "r": 212.87, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 232.29, "t": 256.3, "r": 240.04, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 256.88, "t": 256.3, "r": 264.64, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 281.48, "t": 256.3, "r": 289.23, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 55.53, "t": 264.51, "r": 60.72, "b": 268.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 60.18, "t": 264.3, "r": 65.34, "b": 268.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 65.34, "t": 264.51, "r": 122.38, "b": 268.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 116.45, "t": 264.3, "r": 129.88, "b": 268.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 183.11, "t": 263.53, "r": 190.86, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 210.28, "t": 263.53, "r": 212.87, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 232.29, "t": 263.53, "r": 240.04, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 256.88, "t": 263.53, "r": 264.64, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 281.48, "t": 263.53, "r": 289.23, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 55.53, "t": 271.74, "r": 107.38, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 101.99, "t": 271.53, "r": 109.74, "b": 275.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 109.74, "t": 271.74, "r": 114.93, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 114.39, "t": 271.53, "r": 122.14, "b": 275.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 122.14, "t": 271.74, "r": 127.32, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 184.4, "t": 270.75, "r": 189.56, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 210.28, "t": 270.75, "r": 212.87, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 233.58, "t": 270.75, "r": 238.75, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 256.88, "t": 270.75, "r": 264.64, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 281.48, "t": 270.75, "r": 289.23, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 55.53, "t": 279.01, "r": 68.69, "b": 283.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 68.69, "t": 279.22, "r": 110.17, "b": 283.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 183.11, "t": 277.98, "r": 190.86, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 208.99, "t": 277.98, "r": 214.16, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 233.58, "t": 277.98, "r": 238.75, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 256.88, "t": 277.98, "r": 264.64, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 282.77, "t": 277.98, "r": 287.94, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 169.62, "t": 286.45, "r": 174.8, "b": 290.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 183.11, "t": 285.47, "r": 190.86, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 207.7, "t": 285.47, "r": 215.45, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 232.29, "t": 285.47, "r": 240.04, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 255.77, "t": 285.47, "r": 265.75, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 281.48, "t": 285.47, "r": 289.23, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 10, "num_cols": 6, "table_cells": [ { "bbox": { "l": 209.93, "t": 222.18, "r": 241.04, "b": 226.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 263.76, "t": 222.18, "r": 284.51, "b": 226.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 110.25, "t": 229.67, "r": 120.62, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 175.37, "t": 229.67, "r": 196.11, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb \u6570", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 209.62, "t": 229.67, "r": 219.99, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 229.2, "t": 229.67, "r": 244.75, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 256.11, "t": 229.67, "r": 266.48, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 278.38, "t": 229.67, "r": 293.94, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 236.43, "r": 162.71, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.4, "t": 236.43, "r": 189.56, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99, "t": 236.43, "r": 214.16, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.88, "t": 236.43, "r": 237.46, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 236.43, "r": 264.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06, "t": 236.43, "r": 286.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 242.62, "r": 139.72, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 242.62, "r": 190.86, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.7, "t": 242.62, "r": 215.45, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.88, "t": 242.62, "r": 237.46, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 242.62, "r": 264.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06, "t": 242.62, "r": 286.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 249.8, "r": 97.01, "b": 253.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 248.82, "r": 190.86, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 248.82, "r": 212.87, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 248.82, "r": 240.04, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 248.82, "r": 264.64, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 248.82, "r": 289.23, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 257.28, "r": 91.83, "b": 261.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 256.3, "r": 190.86, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 256.3, "r": 212.87, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 256.3, "r": 240.04, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 256.3, "r": 264.64, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 256.3, "r": 289.23, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 264.51, "r": 60.72, "b": 268.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 263.53, "r": 190.86, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 263.53, "r": 212.87, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 263.53, "r": 240.04, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 263.53, "r": 264.64, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 263.53, "r": 289.23, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 271.74, "r": 107.38, "b": 275.92, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.4, "t": 270.75, "r": 189.56, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 270.75, "r": 212.87, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58, "t": 270.75, "r": 238.75, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 270.75, "r": 264.64, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 270.75, "r": 289.23, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 279.01, "r": 68.69, "b": 283.37, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 277.98, "r": 190.86, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99, "t": 277.98, "r": 214.16, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58, "t": 277.98, "r": 238.75, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 277.98, "r": 264.64, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 282.77, "t": 277.98, "r": 287.94, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 169.62, "t": 286.45, "r": 174.8, "b": 290.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 285.47, "r": 190.86, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.7, "t": 285.47, "r": 215.45, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 285.47, "r": 240.04, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 255.77, "t": 285.47, "r": 265.75, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 285.47, "r": 289.23, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 16, "page_no": 7, "cluster": { "id": 16, "label": "caption", "bbox": { "l": 380.43, "t": 292.3, "r": 549.42, "b": 298.6, "coord_origin": "TOPLEFT" }, "confidence": 0.75, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.43, "r_y0": 298.6, "r_x1": 549.42, "r_y1": 298.6, "r_x2": 549.42, "r_y2": 292.3, "r_x3": 380.43, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Text is aligned to match original for ease of viewing" }, { "label": "table", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "table", "bbox": { "l": 304.92, "t": 218.51, "r": 550.23, "b": 287.9, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 125, "label": "text", "bbox": { "l": 459.05, "t": 221.62, "r": 542.0, "b": 226.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 493.82, "t": 227.83, "r": 507.23, "b": 232.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 393.24, "t": 236.75, "r": 400.75, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 400.75, "t": 236.75, "r": 404.65, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 404.65, "t": 236.75, "r": 407.35, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 392.1, "t": 221.57, "r": 438.01, "b": 226.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 427.18, "t": 236.75, "r": 440.99, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 468.38, "t": 236.75, "r": 482.48, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 516.93, "t": 236.75, "r": 530.73, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 306.11, "t": 244.61, "r": 355.65, "b": 249.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 355.65, "t": 244.61, "r": 364.66, "b": 249.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 396.25, "t": 244.91, "r": 400.75, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 400.75, "t": 244.91, "r": 403.76, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 429.82, "t": 244.91, "r": 437.33, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 465.53, "t": 244.91, "r": 478.4, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 480.98, "t": 244.91, "r": 483.55, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 513.45, "t": 244.91, "r": 531.47, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 306.11, "t": 253.68, "r": 325.63, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 396.25, "t": 253.68, "r": 400.75, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 400.75, "t": 253.68, "r": 403.76, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 429.82, "t": 253.68, "r": 437.33, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 466.44, "t": 253.68, "r": 482.55, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 514.29, "t": 253.68, "r": 530.81, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 306.11, "t": 261.55, "r": 322.63, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 394.43, "t": 261.55, "r": 400.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 400.73, "t": 261.55, "r": 403.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 403.74, "t": 261.55, "r": 405.54, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 427.7, "t": 261.55, "r": 438.81, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 468.56, "t": 261.55, "r": 482.07, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 516.02, "t": 261.55, "r": 529.53, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 155, "label": "text", "bbox": { "l": 306.11, "t": 269.64, "r": 356.25, "b": 274.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 394.43, "t": 270.32, "r": 400.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 157, "label": "text", "bbox": { "l": 400.73, "t": 270.32, "r": 403.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 158, "label": "text", "bbox": { "l": 403.74, "t": 270.32, "r": 405.54, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 159, "label": "text", "bbox": { "l": 431.03, "t": 270.32, "r": 436.43, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 160, "label": "text", "bbox": { "l": 465.83, "t": 270.32, "r": 482.35, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 161, "label": "text", "bbox": { "l": 516.02, "t": 270.32, "r": 529.53, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 162, "label": "text", "bbox": { "l": 306.11, "t": 278.49, "r": 373.36, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 163, "label": "text", "bbox": { "l": 396.25, "t": 278.49, "r": 403.76, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 164, "label": "text", "bbox": { "l": 429.52, "t": 278.49, "r": 437.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 165, "label": "text", "bbox": { "l": 463.71, "t": 278.49, "r": 484.74, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 166, "label": "text", "bbox": { "l": 512.99, "t": 278.49, "r": 534.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 459.05, "t": 221.62, "r": 542.0, "b": 226.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 393.24, "t": 236.75, "r": 400.75, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RS U s", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 392.1, "t": 221.57, "r": 438.01, "b": 226.64, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.18, "t": 236.75, "r": 440.99, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 468.38, "t": 236.75, "r": 482.48, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 516.93, "t": 236.75, "r": 530.73, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 244.61, "r": 355.65, "b": 249.68, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on Janua ry 1", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 244.91, "r": 400.75, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1. 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.82, "t": 244.91, "r": 437.33, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.53, "t": 244.91, "r": 478.4, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.45, "t": 244.91, "r": 531.47, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 253.68, "r": 325.63, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 253.68, "r": 400.75, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0. 5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.82, "t": 253.68, "r": 437.33, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 466.44, "t": 253.68, "r": 482.55, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 514.29, "t": 253.68, "r": 530.81, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 261.55, "r": 322.63, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43, "t": 261.55, "r": 400.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 5 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 427.7, "t": 261.55, "r": 438.81, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 468.56, "t": 261.55, "r": 482.07, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.02, "t": 261.55, "r": 529.53, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 269.64, "r": 356.25, "b": 274.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43, "t": 270.32, "r": 400.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 1 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 431.03, "t": 270.32, "r": 436.43, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.83, "t": 270.32, "r": 482.35, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.02, "t": 270.32, "r": 529.53, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 278.49, "r": 373.36, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 278.49, "r": 403.76, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.52, "t": 278.49, "r": 437.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 463.71, "t": 278.49, "r": 484.74, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.99, "t": 278.49, "r": 534.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 50.11, "t": 320.88, "r": 545.11, "b": 365.65, "coord_origin": "TOPLEFT" }, "confidence": 0.914, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 329.78, "r_x1": 86.86, "r_y1": 329.78, "r_x2": 86.86, "r_y2": 320.88, "r_x3": 50.11, "r_y3": 320.88, "coord_origin": "TOPLEFT" }, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.92, "r_y0": 329.78, "r_x1": 545.11, "r_y1": 329.78, "r_x2": 545.11, "r_y2": 320.88, "r_x3": 93.92, "r_y3": 320.88, "coord_origin": "TOPLEFT" }, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 341.74, "r_x1": 545.11, "r_y1": 341.74, "r_x2": 545.11, "r_y2": 332.83, "r_x3": 50.11, "r_y3": 332.83, "coord_origin": "TOPLEFT" }, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 353.69, "r_x1": 545.11, "r_y1": 353.69, "r_x2": 545.11, "r_y2": 344.79, "r_x3": 50.11, "r_y3": 344.79, "coord_origin": "TOPLEFT" }, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 365.65, "r_x1": 139.8, "r_y1": 365.65, "r_x2": 139.8, "r_y2": 356.74, "r_x3": 50.11, "r_y3": 356.74, "coord_origin": "TOPLEFT" }, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset." }, { "label": "picture", "id": 12, "page_no": 7, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 216.77, "t": 380.49, "r": 375.78, "b": 443.35, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26, "r_y0": 386.44, "r_x1": 342.08, "r_y1": 386.44, "r_x2": 342.08, "r_y2": 381.78, "r_x3": 220.26, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 167, "label": "text", "bbox": { "l": 220.26, "t": 381.78, "r": 342.08, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26, "r_y0": 386.44, "r_x1": 342.08, "r_y1": 386.44, "r_x2": 342.08, "r_y2": 381.78, "r_x3": 220.26, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 11, "page_no": 7, "cluster": { "id": 11, "label": "picture", "bbox": { "l": 51.74, "t": 380.48, "r": 211.84, "b": 443.66, "coord_origin": "TOPLEFT" }, "confidence": 0.831, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.72, "r_y0": 386.44, "r_x1": 85.66, "r_y1": 386.44, "r_x2": 85.66, "r_y2": 381.78, "r_x3": 53.72, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 168, "label": "text", "bbox": { "l": 53.72, "t": 381.78, "r": 85.66, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.72, "r_y0": 386.44, "r_x1": 85.66, "r_y1": 386.44, "r_x2": 85.66, "r_y2": 381.78, "r_x3": 53.72, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 13, "page_no": 7, "cluster": { "id": 13, "label": "picture", "bbox": { "l": 383.14, "t": 381.23, "r": 542.11, "b": 442.77, "coord_origin": "TOPLEFT" }, "confidence": 0.788, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 406.87, "r_x1": 443.7, "r_y1": 406.87, "r_x2": 443.7, "r_y2": 400.55, "r_x3": 437.38, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 406.87, "r_x1": 456.65, "r_y1": 406.87, "r_x2": 456.65, "r_y2": 400.55, "r_x3": 450.33, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 406.87, "r_x1": 469.6, "r_y1": 406.87, "r_x2": 469.6, "r_y2": 400.55, "r_x3": 463.28, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 406.87, "r_x1": 482.56, "r_y1": 406.87, "r_x2": 482.56, "r_y2": 400.55, "r_x3": 476.24, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 406.87, "r_x1": 495.51, "r_y1": 406.87, "r_x2": 495.51, "r_y2": 400.55, "r_x3": 489.19, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 406.87, "r_x1": 508.46, "r_y1": 406.87, "r_x2": 508.46, "r_y2": 400.55, "r_x3": 502.14, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 406.87, "r_x1": 521.41, "r_y1": 406.87, "r_x2": 521.41, "r_y2": 400.55, "r_x3": 515.1, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 417.36, "r_x1": 391.6, "r_y1": 417.36, "r_x2": 391.6, "r_y2": 411.04, "r_x3": 385.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 417.36, "r_x1": 404.84, "r_y1": 417.36, "r_x2": 404.84, "r_y2": 411.04, "r_x3": 398.52, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 417.36, "r_x1": 417.8, "r_y1": 417.36, "r_x2": 417.8, "r_y2": 411.04, "r_x3": 411.48, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 417.36, "r_x1": 443.7, "r_y1": 417.36, "r_x2": 443.7, "r_y2": 411.04, "r_x3": 437.38, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 417.36, "r_x1": 456.65, "r_y1": 417.36, "r_x2": 456.65, "r_y2": 411.04, "r_x3": 450.33, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 417.36, "r_x1": 469.6, "r_y1": 417.36, "r_x2": 469.6, "r_y2": 411.04, "r_x3": 463.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 427.39, "r_x1": 391.6, "r_y1": 427.39, "r_x2": 391.6, "r_y2": 421.07, "r_x3": 385.28, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 427.39, "r_x1": 404.84, "r_y1": 427.39, "r_x2": 404.84, "r_y2": 421.07, "r_x3": 398.52, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 427.39, "r_x1": 417.8, "r_y1": 427.39, "r_x2": 417.8, "r_y2": 421.07, "r_x3": 411.48, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 427.39, "r_x1": 430.75, "r_y1": 427.39, "r_x2": 430.75, "r_y2": 421.07, "r_x3": 424.43, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 427.39, "r_x1": 443.7, "r_y1": 427.39, "r_x2": 443.7, "r_y2": 421.07, "r_x3": 437.38, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 427.39, "r_x1": 456.65, "r_y1": 427.39, "r_x2": 456.65, "r_y2": 421.07, "r_x3": 450.33, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 427.39, "r_x1": 469.61, "r_y1": 427.39, "r_x2": 469.61, "r_y2": 421.07, "r_x3": 463.29, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 427.39, "r_x1": 482.56, "r_y1": 427.39, "r_x2": 482.56, "r_y2": 421.07, "r_x3": 476.24, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 427.39, "r_x1": 495.51, "r_y1": 427.39, "r_x2": 495.51, "r_y2": 421.07, "r_x3": 489.19, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 427.39, "r_x1": 508.46, "r_y1": 427.39, "r_x2": 508.46, "r_y2": 421.07, "r_x3": 502.14, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 427.39, "r_x1": 521.42, "r_y1": 427.39, "r_x2": 521.42, "r_y2": 421.07, "r_x3": 515.1, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 427.39, "r_x1": 534.37, "r_y1": 427.39, "r_x2": 534.37, "r_y2": 421.07, "r_x3": 528.05, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 438.36, "r_x1": 391.6, "r_y1": 438.36, "r_x2": 391.6, "r_y2": 432.04, "r_x3": 385.28, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 438.36, "r_x1": 404.84, "r_y1": 438.36, "r_x2": 404.84, "r_y2": 432.04, "r_x3": 398.52, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 438.36, "r_x1": 417.8, "r_y1": 438.36, "r_x2": 417.8, "r_y2": 432.04, "r_x3": 411.48, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 438.36, "r_x1": 430.75, "r_y1": 438.36, "r_x2": 430.75, "r_y2": 432.04, "r_x3": 424.43, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 438.36, "r_x1": 443.7, "r_y1": 438.36, "r_x2": 443.7, "r_y2": 432.04, "r_x3": 437.38, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 438.36, "r_x1": 456.65, "r_y1": 438.36, "r_x2": 456.65, "r_y2": 432.04, "r_x3": 450.33, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 438.36, "r_x1": 469.61, "r_y1": 438.36, "r_x2": 469.61, "r_y2": 432.04, "r_x3": 463.29, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 438.36, "r_x1": 482.56, "r_y1": 438.36, "r_x2": 482.56, "r_y2": 432.04, "r_x3": 476.24, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 438.36, "r_x1": 495.51, "r_y1": 438.36, "r_x2": 495.51, "r_y2": 432.04, "r_x3": 489.19, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 438.36, "r_x1": 508.46, "r_y1": 438.36, "r_x2": 508.46, "r_y2": 432.04, "r_x3": 502.14, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 438.36, "r_x1": 521.42, "r_y1": 438.36, "r_x2": 521.42, "r_y2": 432.04, "r_x3": 515.1, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 438.36, "r_x1": 534.37, "r_y1": 438.36, "r_x2": 534.37, "r_y2": 432.04, "r_x3": 528.05, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 395.52, "r_x1": 388.44, "r_y1": 395.52, "r_x2": 388.44, "r_y2": 389.2, "r_x3": 385.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 395.52, "r_x1": 401.68, "r_y1": 395.52, "r_x2": 401.68, "r_y2": 389.2, "r_x3": 398.52, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 395.52, "r_x1": 414.63, "r_y1": 395.52, "r_x2": 414.63, "r_y2": 389.2, "r_x3": 411.48, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 395.52, "r_x1": 427.59, "r_y1": 395.52, "r_x2": 427.59, "r_y2": 389.2, "r_x3": 424.43, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 395.52, "r_x1": 440.54, "r_y1": 395.52, "r_x2": 440.54, "r_y2": 389.2, "r_x3": 437.38, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 395.52, "r_x1": 453.49, "r_y1": 395.52, "r_x2": 453.49, "r_y2": 389.2, "r_x3": 450.33, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 395.52, "r_x1": 466.44, "r_y1": 395.52, "r_x2": 466.44, "r_y2": 389.2, "r_x3": 463.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 395.52, "r_x1": 479.39, "r_y1": 395.52, "r_x2": 479.39, "r_y2": 389.2, "r_x3": 476.24, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 395.52, "r_x1": 492.35, "r_y1": 395.52, "r_x2": 492.35, "r_y2": 389.2, "r_x3": 489.19, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 395.52, "r_x1": 505.3, "r_y1": 395.52, "r_x2": 505.3, "r_y2": 389.2, "r_x3": 502.14, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09, "r_y0": 395.52, "r_x1": 521.41, "r_y1": 395.52, "r_x2": 521.41, "r_y2": 389.2, "r_x3": 515.09, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04, "r_y0": 395.52, "r_x1": 534.13, "r_y1": 395.52, "r_x2": 534.13, "r_y2": 389.2, "r_x3": 528.04, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 405.29, "r_x1": 391.6, "r_y1": 405.29, "r_x2": 391.6, "r_y2": 398.97, "r_x3": 385.28, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 405.29, "r_x1": 404.84, "r_y1": 405.29, "r_x2": 404.84, "r_y2": 398.97, "r_x3": 398.52, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 405.29, "r_x1": 417.8, "r_y1": 405.29, "r_x2": 417.8, "r_y2": 398.97, "r_x3": 411.48, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 413.09, "r_x1": 430.75, "r_y1": 413.09, "r_x2": 430.75, "r_y2": 406.77, "r_x3": 424.43, "r_y3": 406.77, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.87, "r_y0": 417.31, "r_x1": 509.19, "r_y1": 417.31, "r_x2": 509.19, "r_y2": 410.99, "r_x3": 502.87, "r_y3": 410.99, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35, "r_y0": 386.44, "r_x1": 430.99, "r_y1": 386.44, "r_x2": 430.99, "r_y2": 381.78, "r_x3": 384.35, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 169, "label": "text", "bbox": { "l": 437.38, "t": 400.55, "r": 443.7, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 406.87, "r_x1": 443.7, "r_y1": 406.87, "r_x2": 443.7, "r_y2": 400.55, "r_x3": 437.38, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 170, "label": "text", "bbox": { "l": 450.33, "t": 400.55, "r": 456.65, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 406.87, "r_x1": 456.65, "r_y1": 406.87, "r_x2": 456.65, "r_y2": 400.55, "r_x3": 450.33, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 171, "label": "text", "bbox": { "l": 463.28, "t": 400.55, "r": 469.6, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 406.87, "r_x1": 469.6, "r_y1": 406.87, "r_x2": 469.6, "r_y2": 400.55, "r_x3": 463.28, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 172, "label": "text", "bbox": { "l": 476.24, "t": 400.55, "r": 482.56, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 406.87, "r_x1": 482.56, "r_y1": 406.87, "r_x2": 482.56, "r_y2": 400.55, "r_x3": 476.24, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 173, "label": "text", "bbox": { "l": 489.19, "t": 400.55, "r": 495.51, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 406.87, "r_x1": 495.51, "r_y1": 406.87, "r_x2": 495.51, "r_y2": 400.55, "r_x3": 489.19, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 174, "label": "text", "bbox": { "l": 502.14, "t": 400.55, "r": 508.46, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 406.87, "r_x1": 508.46, "r_y1": 406.87, "r_x2": 508.46, "r_y2": 400.55, "r_x3": 502.14, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 175, "label": "text", "bbox": { "l": 515.1, "t": 400.55, "r": 521.41, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 406.87, "r_x1": 521.41, "r_y1": 406.87, "r_x2": 521.41, "r_y2": 400.55, "r_x3": 515.1, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 176, "label": "text", "bbox": { "l": 385.28, "t": 411.04, "r": 391.6, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 417.36, "r_x1": 391.6, "r_y1": 417.36, "r_x2": 391.6, "r_y2": 411.04, "r_x3": 385.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 177, "label": "text", "bbox": { "l": 398.52, "t": 411.04, "r": 404.84, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 417.36, "r_x1": 404.84, "r_y1": 417.36, "r_x2": 404.84, "r_y2": 411.04, "r_x3": 398.52, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 178, "label": "text", "bbox": { "l": 411.48, "t": 411.04, "r": 417.8, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 417.36, "r_x1": 417.8, "r_y1": 417.36, "r_x2": 417.8, "r_y2": 411.04, "r_x3": 411.48, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 179, "label": "text", "bbox": { "l": 437.38, "t": 411.04, "r": 443.7, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 417.36, "r_x1": 443.7, "r_y1": 417.36, "r_x2": 443.7, "r_y2": 411.04, "r_x3": 437.38, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 180, "label": "text", "bbox": { "l": 450.33, "t": 411.04, "r": 456.65, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 417.36, "r_x1": 456.65, "r_y1": 417.36, "r_x2": 456.65, "r_y2": 411.04, "r_x3": 450.33, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 181, "label": "text", "bbox": { "l": 463.28, "t": 411.04, "r": 469.6, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 417.36, "r_x1": 469.6, "r_y1": 417.36, "r_x2": 469.6, "r_y2": 411.04, "r_x3": 463.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 182, "label": "text", "bbox": { "l": 385.28, "t": 421.07, "r": 391.6, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 427.39, "r_x1": 391.6, "r_y1": 427.39, "r_x2": 391.6, "r_y2": 421.07, "r_x3": 385.28, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 183, "label": "text", "bbox": { "l": 398.52, "t": 421.07, "r": 404.84, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 427.39, "r_x1": 404.84, "r_y1": 427.39, "r_x2": 404.84, "r_y2": 421.07, "r_x3": 398.52, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 184, "label": "text", "bbox": { "l": 411.48, "t": 421.07, "r": 417.8, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 427.39, "r_x1": 417.8, "r_y1": 427.39, "r_x2": 417.8, "r_y2": 421.07, "r_x3": 411.48, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 185, "label": "text", "bbox": { "l": 424.43, "t": 421.07, "r": 430.75, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 427.39, "r_x1": 430.75, "r_y1": 427.39, "r_x2": 430.75, "r_y2": 421.07, "r_x3": 424.43, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 186, "label": "text", "bbox": { "l": 437.38, "t": 421.07, "r": 443.7, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 427.39, "r_x1": 443.7, "r_y1": 427.39, "r_x2": 443.7, "r_y2": 421.07, "r_x3": 437.38, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 187, "label": "text", "bbox": { "l": 450.33, "t": 421.07, "r": 456.65, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 427.39, "r_x1": 456.65, "r_y1": 427.39, "r_x2": 456.65, "r_y2": 421.07, "r_x3": 450.33, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 188, "label": "text", "bbox": { "l": 463.29, "t": 421.07, "r": 469.61, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 427.39, "r_x1": 469.61, "r_y1": 427.39, "r_x2": 469.61, "r_y2": 421.07, "r_x3": 463.29, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 189, "label": "text", "bbox": { "l": 476.24, "t": 421.07, "r": 482.56, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 427.39, "r_x1": 482.56, "r_y1": 427.39, "r_x2": 482.56, "r_y2": 421.07, "r_x3": 476.24, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 190, "label": "text", "bbox": { "l": 489.19, "t": 421.07, "r": 495.51, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 427.39, "r_x1": 495.51, "r_y1": 427.39, "r_x2": 495.51, "r_y2": 421.07, "r_x3": 489.19, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 191, "label": "text", "bbox": { "l": 502.14, "t": 421.07, "r": 508.46, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 427.39, "r_x1": 508.46, "r_y1": 427.39, "r_x2": 508.46, "r_y2": 421.07, "r_x3": 502.14, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 192, "label": "text", "bbox": { "l": 515.1, "t": 421.07, "r": 521.42, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 427.39, "r_x1": 521.42, "r_y1": 427.39, "r_x2": 521.42, "r_y2": 421.07, "r_x3": 515.1, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 193, "label": "text", "bbox": { "l": 528.05, "t": 421.07, "r": 534.37, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 427.39, "r_x1": 534.37, "r_y1": 427.39, "r_x2": 534.37, "r_y2": 421.07, "r_x3": 528.05, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 194, "label": "text", "bbox": { "l": 385.28, "t": 432.04, "r": 391.6, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 438.36, "r_x1": 391.6, "r_y1": 438.36, "r_x2": 391.6, "r_y2": 432.04, "r_x3": 385.28, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 195, "label": "text", "bbox": { "l": 398.52, "t": 432.04, "r": 404.84, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 438.36, "r_x1": 404.84, "r_y1": 438.36, "r_x2": 404.84, "r_y2": 432.04, "r_x3": 398.52, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 196, "label": "text", "bbox": { "l": 411.48, "t": 432.04, "r": 417.8, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 438.36, "r_x1": 417.8, "r_y1": 438.36, "r_x2": 417.8, "r_y2": 432.04, "r_x3": 411.48, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 197, "label": "text", "bbox": { "l": 424.43, "t": 432.04, "r": 430.75, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 438.36, "r_x1": 430.75, "r_y1": 438.36, "r_x2": 430.75, "r_y2": 432.04, "r_x3": 424.43, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 198, "label": "text", "bbox": { "l": 437.38, "t": 432.04, "r": 443.7, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 438.36, "r_x1": 443.7, "r_y1": 438.36, "r_x2": 443.7, "r_y2": 432.04, "r_x3": 437.38, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 199, "label": "text", "bbox": { "l": 450.33, "t": 432.04, "r": 456.65, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 438.36, "r_x1": 456.65, "r_y1": 438.36, "r_x2": 456.65, "r_y2": 432.04, "r_x3": 450.33, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 200, "label": "text", "bbox": { "l": 463.29, "t": 432.04, "r": 469.61, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 438.36, "r_x1": 469.61, "r_y1": 438.36, "r_x2": 469.61, "r_y2": 432.04, "r_x3": 463.29, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 201, "label": "text", "bbox": { "l": 476.24, "t": 432.04, "r": 482.56, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 438.36, "r_x1": 482.56, "r_y1": 438.36, "r_x2": 482.56, "r_y2": 432.04, "r_x3": 476.24, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 202, "label": "text", "bbox": { "l": 489.19, "t": 432.04, "r": 495.51, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 438.36, "r_x1": 495.51, "r_y1": 438.36, "r_x2": 495.51, "r_y2": 432.04, "r_x3": 489.19, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 203, "label": "text", "bbox": { "l": 502.14, "t": 432.04, "r": 508.46, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 438.36, "r_x1": 508.46, "r_y1": 438.36, "r_x2": 508.46, "r_y2": 432.04, "r_x3": 502.14, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 204, "label": "text", "bbox": { "l": 515.1, "t": 432.04, "r": 521.42, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 438.36, "r_x1": 521.42, "r_y1": 438.36, "r_x2": 521.42, "r_y2": 432.04, "r_x3": 515.1, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 205, "label": "text", "bbox": { "l": 528.05, "t": 432.04, "r": 534.37, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 438.36, "r_x1": 534.37, "r_y1": 438.36, "r_x2": 534.37, "r_y2": 432.04, "r_x3": 528.05, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 206, "label": "text", "bbox": { "l": 385.28, "t": 389.2, "r": 388.44, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 395.52, "r_x1": 388.44, "r_y1": 395.52, "r_x2": 388.44, "r_y2": 389.2, "r_x3": 385.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 207, "label": "text", "bbox": { "l": 398.52, "t": 389.2, "r": 401.68, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 395.52, "r_x1": 401.68, "r_y1": 395.52, "r_x2": 401.68, "r_y2": 389.2, "r_x3": 398.52, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 208, "label": "text", "bbox": { "l": 411.48, "t": 389.2, "r": 414.63, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 395.52, "r_x1": 414.63, "r_y1": 395.52, "r_x2": 414.63, "r_y2": 389.2, "r_x3": 411.48, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 209, "label": "text", "bbox": { "l": 424.43, "t": 389.2, "r": 427.59, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 395.52, "r_x1": 427.59, "r_y1": 395.52, "r_x2": 427.59, "r_y2": 389.2, "r_x3": 424.43, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 210, "label": "text", "bbox": { "l": 437.38, "t": 389.2, "r": 440.54, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 395.52, "r_x1": 440.54, "r_y1": 395.52, "r_x2": 440.54, "r_y2": 389.2, "r_x3": 437.38, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 211, "label": "text", "bbox": { "l": 450.33, "t": 389.2, "r": 453.49, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 395.52, "r_x1": 453.49, "r_y1": 395.52, "r_x2": 453.49, "r_y2": 389.2, "r_x3": 450.33, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 212, "label": "text", "bbox": { "l": 463.28, "t": 389.2, "r": 466.44, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 395.52, "r_x1": 466.44, "r_y1": 395.52, "r_x2": 466.44, "r_y2": 389.2, "r_x3": 463.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 213, "label": "text", "bbox": { "l": 476.24, "t": 389.2, "r": 479.39, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 395.52, "r_x1": 479.39, "r_y1": 395.52, "r_x2": 479.39, "r_y2": 389.2, "r_x3": 476.24, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 214, "label": "text", "bbox": { "l": 489.19, "t": 389.2, "r": 492.35, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 395.52, "r_x1": 492.35, "r_y1": 395.52, "r_x2": 492.35, "r_y2": 389.2, "r_x3": 489.19, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 215, "label": "text", "bbox": { "l": 502.14, "t": 389.2, "r": 505.3, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 395.52, "r_x1": 505.3, "r_y1": 395.52, "r_x2": 505.3, "r_y2": 389.2, "r_x3": 502.14, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 216, "label": "text", "bbox": { "l": 515.09, "t": 389.2, "r": 521.41, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09, "r_y0": 395.52, "r_x1": 521.41, "r_y1": 395.52, "r_x2": 521.41, "r_y2": 389.2, "r_x3": 515.09, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 217, "label": "text", "bbox": { "l": 528.04, "t": 389.2, "r": 534.13, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04, "r_y0": 395.52, "r_x1": 534.13, "r_y1": 395.52, "r_x2": 534.13, "r_y2": 389.2, "r_x3": 528.04, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 218, "label": "text", "bbox": { "l": 385.28, "t": 398.97, "r": 391.6, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 405.29, "r_x1": 391.6, "r_y1": 405.29, "r_x2": 391.6, "r_y2": 398.97, "r_x3": 385.28, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 219, "label": "text", "bbox": { "l": 398.52, "t": 398.97, "r": 404.84, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 405.29, "r_x1": 404.84, "r_y1": 405.29, "r_x2": 404.84, "r_y2": 398.97, "r_x3": 398.52, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 220, "label": "text", "bbox": { "l": 411.48, "t": 398.97, "r": 417.8, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 405.29, "r_x1": 417.8, "r_y1": 405.29, "r_x2": 417.8, "r_y2": 398.97, "r_x3": 411.48, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 221, "label": "text", "bbox": { "l": 424.43, "t": 406.77, "r": 430.75, "b": 413.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 413.09, "r_x1": 430.75, "r_y1": 413.09, "r_x2": 430.75, "r_y2": 406.77, "r_x3": 424.43, "r_y3": 406.77, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 222, "label": "text", "bbox": { "l": 502.87, "t": 410.99, "r": 509.19, "b": 417.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.87, "r_y0": 417.31, "r_x1": 509.19, "r_y1": 417.31, "r_x2": 509.19, "r_y2": 410.99, "r_x3": 502.87, "r_y3": 410.99, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 223, "label": "text", "bbox": { "l": 384.35, "t": 381.78, "r": 430.99, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35, "r_y0": 386.44, "r_x1": 430.99, "r_y1": 386.44, "r_x2": 430.99, "r_y2": 381.78, "r_x3": 384.35, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 62.6, "t": 458.73, "r": 532.63, "b": 467.63, "coord_origin": "TOPLEFT" }, "confidence": 0.915, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.6, "r_y0": 467.63, "r_x1": 532.63, "r_y1": 467.63, "r_x2": 532.63, "r_y2": 458.73, "r_x3": 62.6, "r_y3": 458.73, "coord_origin": "TOPLEFT" }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 50.11, "t": 491.4, "r": 163.76, "b": 501.25, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 501.25, "r_x1": 64.45, "r_y1": 501.25, "r_x2": 64.45, "r_y2": 491.4, "r_x3": 50.11, "r_y3": 491.4, "coord_origin": "TOPLEFT" }, "text": "5.5.", "orig": "5.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.01, "r_y0": 501.25, "r_x1": 163.76, "r_y1": 501.25, "r_x2": 163.76, "r_y2": 491.4, "r_x3": 74.01, "r_y3": 491.4, "coord_origin": "TOPLEFT" }, "text": "Qualitative Analysis", "orig": "Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.5. Qualitative Analysis" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 536.87, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 545.78, "r_x1": 286.36, "r_y1": 545.78, "r_x2": 286.36, "r_y2": 536.87, "r_x3": 62.07, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "We showcase several visualizations for the different", "orig": "We showcase several visualizations for the different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 557.73, "r_x1": 211.16, "r_y1": 557.73, "r_x2": 211.16, "r_y2": 548.83, "r_x3": 50.11, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.1, "r_y0": 557.51, "r_x1": 259.17, "r_y1": 557.51, "r_x2": 259.17, "r_y2": 548.92, "r_x3": 215.1, "r_y3": 548.92, "coord_origin": "TOPLEFT" }, "text": "\u201ccomplex\u201d", "orig": "\u201ccomplex\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.12, "r_y0": 557.73, "r_x1": 286.36, "r_y1": 557.73, "r_x2": 286.36, "r_y2": 548.83, "r_x3": 263.12, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 569.69, "r_x1": 286.37, "r_y1": 569.69, "r_x2": 286.37, "r_y2": 560.78, "r_x3": 50.11, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "within datasets presented in this work in Fig. 5 and Fig. 6", "orig": "within datasets presented in this work in Fig. 5 and Fig. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 581.64, "r_x1": 286.37, "r_y1": 581.64, "r_x2": 286.37, "r_y2": 572.74, "r_x3": 50.11, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 593.6, "r_x1": 286.37, "r_y1": 593.6, "r_x2": 286.37, "r_y2": 584.69, "r_x3": 50.11, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "for all table cells, even for the empty ones. Additionally,", "orig": "for all table cells, even for the empty ones. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 605.56, "r_x1": 286.37, "r_y1": 605.56, "r_x2": 286.37, "r_y2": 596.65, "r_x3": 50.11, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 617.51, "r_x1": 286.37, "r_y1": 617.51, "r_x2": 286.37, "r_y2": 608.6, "r_x3": 50.11, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 629.47, "r_x1": 286.37, "r_y1": 629.47, "r_x2": 286.37, "r_y2": 620.56, "r_x3": 50.11, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "based on their overlap and spatial proximity. The left part", "orig": "based on their overlap and spatial proximity. The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 641.42, "r_x1": 286.37, "r_y1": 641.42, "r_x2": 286.37, "r_y2": 632.51, "r_x3": 50.11, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "of Fig. 5 demonstrates also the adaptability of our method", "orig": "of Fig. 5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "to any language, as it can successfully extract Japanese", "orig": "to any language, as it can successfully extract Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 50.11, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "steps in the supplementary material. Overall these illustra-", "orig": "steps in the supplementary material. Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 226.89, "r_y1": 713.15, "r_x2": 226.89, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We showcase several visualizations for the different components of our network on various \"complex\" tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type." }, { "label": "section_header", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 308.86, "t": 490.71, "r": 460.85, "b": 501.46, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 501.46, "r_x1": 316.07, "r_y1": 501.46, "r_x2": 316.07, "r_y2": 490.71, "r_x3": 308.86, "r_y3": 490.71, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.69, "r_y0": 501.46, "r_x1": 460.85, "r_y1": 501.46, "r_x2": 460.85, "r_y2": 490.71, "r_x3": 325.69, "r_y3": 490.71, "coord_origin": "TOPLEFT" }, "text": "Future Work & Conclusion", "orig": "Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Future Work & Conclusion" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 512.89, "r": 545.12, "b": 653.31, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 521.8, "r_x1": 545.12, "r_y1": 521.8, "r_x2": 545.12, "r_y2": 512.89, "r_x3": 320.82, "r_y3": 512.89, "coord_origin": "TOPLEFT" }, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.75, "r_x1": 545.12, "r_y1": 533.75, "r_x2": 545.12, "r_y2": 524.85, "r_x3": 308.86, "r_y3": 524.85, "coord_origin": "TOPLEFT" }, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.71, "r_x1": 545.12, "r_y1": 545.71, "r_x2": 545.12, "r_y2": 536.8, "r_x3": 308.86, "r_y3": 536.8, "coord_origin": "TOPLEFT" }, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.66, "r_x1": 545.12, "r_y1": 557.66, "r_x2": 545.12, "r_y2": 548.76, "r_x3": 308.86, "r_y3": 548.76, "coord_origin": "TOPLEFT" }, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.62, "r_x1": 545.12, "r_y1": 569.62, "r_x2": 545.12, "r_y2": 560.71, "r_x3": 308.86, "r_y3": 560.71, "coord_origin": "TOPLEFT" }, "text": "content from PDF or OCR by using bounding boxes. Ad-", "orig": "content from PDF or OCR by using bounding boxes. Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.57, "r_x1": 545.12, "r_y1": 581.57, "r_x2": 545.12, "r_y2": 572.67, "r_x3": 308.86, "r_y3": 572.67, "coord_origin": "TOPLEFT" }, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.53, "r_x1": 545.12, "r_y1": 593.53, "r_x2": 545.12, "r_y2": 584.62, "r_x3": 308.86, "r_y3": 584.62, "coord_origin": "TOPLEFT" }, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.49, "r_x1": 400.47, "r_y1": 605.49, "r_x2": 400.47, "r_y2": 596.58, "r_x3": 308.86, "r_y3": 596.58, "coord_origin": "TOPLEFT" }, "text": "ments, and languages.", "orig": "ments, and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.38, "r_y0": 605.49, "r_x1": 545.12, "r_y1": 605.49, "r_x2": 545.12, "r_y2": 596.58, "r_x3": 408.38, "r_y3": 596.58, "coord_origin": "TOPLEFT" }, "text": "Furthermore, our method outper-", "orig": "Furthermore, our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.44, "r_x1": 545.12, "r_y1": 617.44, "r_x2": 545.12, "r_y2": 608.53, "r_x3": 308.86, "r_y3": 608.53, "coord_origin": "TOPLEFT" }, "text": "forms all state-of-the-arts with a wide margin. Finally, we", "orig": "forms all state-of-the-arts with a wide margin. Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.4, "r_x1": 545.12, "r_y1": 629.4, "r_x2": 545.12, "r_y2": 620.49, "r_x3": 308.86, "r_y3": 620.49, "coord_origin": "TOPLEFT" }, "text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.35, "r_x1": 545.12, "r_y1": 641.35, "r_x2": 545.12, "r_y2": 632.44, "r_x3": 308.86, "r_y3": 632.44, "coord_origin": "TOPLEFT" }, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.31, "r_x1": 365.86, "r_y1": 653.31, "r_x2": 365.86, "r_y2": 644.4, "r_x3": 308.86, "r_y3": 644.4, "coord_origin": "TOPLEFT" }, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce \"SynthTabNet\" a challenging synthetically generated dataset that reinforces missing characteristics from other datasets." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 308.86, "t": 672.1, "r": 364.41, "b": 682.85, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 682.85, "r_x1": 364.41, "r_y1": 682.85, "r_x2": 364.41, "r_y2": 672.1, "r_x3": 308.86, "r_y3": 672.1, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 10, "page_no": 7, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 313.35, "t": 693.96, "r": 545.11, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.832, "cells": [ { "index": 217, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.35, "r_y0": 701.98, "r_x1": 323.81, "r_y1": 701.98, "r_x2": 323.81, "r_y2": 693.96, "r_x3": 313.35, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 218, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.05, "r_y0": 701.98, "r_x1": 545.11, "r_y1": 701.98, "r_x2": 545.11, "r_y2": 693.96, "r_x3": 326.05, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 219, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 712.94, "r_x1": 545.11, "r_y1": 712.94, "r_x2": 545.11, "r_y2": 704.92, "r_x3": 328.78, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-" }, { "label": "page_footer", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.871, "cells": [ { "index": 220, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" }, { "label": "picture", "id": 15, "page_no": 7, "cluster": { "id": 15, "label": "picture", "bbox": { "l": 305.58, "t": 98.65, "r": 554.83, "b": 180.63, "coord_origin": "TOPLEFT" }, "confidence": 0.77, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 14, "page_no": 7, "cluster": { "id": 14, "label": "picture", "bbox": { "l": 49.98, "t": 103.71, "r": 301.63, "b": 187.58, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 18, "page_no": 7, "cluster": { "id": 18, "label": "caption", "bbox": { "l": 53.81, "t": 208.23, "r": 385.93, "b": 216.11, "coord_origin": "TOPLEFT" }, "confidence": 0.599, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.81, "r_y0": 216.11, "r_x1": 62.22, "r_y1": 216.11, "r_x2": 62.22, "r_y2": 208.23, "r_x3": 53.81, "r_y3": 208.23, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.42, "r_y0": 216.11, "r_x1": 385.93, "r_y1": 216.11, "r_x2": 385.93, "r_y2": 208.23, "r_x3": 66.42, "r_y3": 208.23, "coord_origin": "TOPLEFT" }, "text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:" }, { "label": "section_header", "id": 29, "page_no": 7, "cluster": { "id": 29, "label": "section_header", "bbox": { "l": 53.81, "t": 94.28, "r": 284.35, "b": 102.15, "coord_origin": "TOPLEFT" }, "confidence": 0.465, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.81, "r_y0": 102.15, "r_x1": 284.35, "r_y1": 102.15, "r_x2": 284.35, "r_y2": 94.28, "r_x3": 53.81, "r_y3": 94.28, "coord_origin": "TOPLEFT" }, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Japanese language (previously unseen by TableFormer):" }, { "label": "section_header", "id": 31, "page_no": 7, "cluster": { "id": 31, "label": "section_header", "bbox": { "l": 304.83, "t": 94.28, "r": 431.09, "b": 102.15, "coord_origin": "TOPLEFT" }, "confidence": 0.463, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 304.83, "r_y0": 102.15, "r_x1": 431.09, "r_y1": 102.15, "r_x2": 431.09, "r_y2": 94.28, "r_x3": 304.83, "r_y3": 94.28, "coord_origin": "TOPLEFT" }, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Example table from FinTabNet:" }, { "label": "list_item", "id": 20, "page_no": 7, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 53.29, "t": 78.69, "r": 61.55, "b": 86.56, "coord_origin": "TOPLEFT" }, "confidence": 0.582, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.29, "r_y0": 86.56, "r_x1": 61.55, "r_y1": 86.56, "r_x2": 61.55, "r_y2": 78.69, "r_x3": 53.29, "r_y3": 78.69, "coord_origin": "TOPLEFT" }, "text": "a.", "orig": "a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "a." }, { "label": "list_item", "id": 21, "page_no": 7, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 65.68, "t": 78.69, "r": 499.56, "b": 86.56, "coord_origin": "TOPLEFT" }, "confidence": 0.541, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.68, "r_y0": 86.56, "r_x1": 499.56, "r_y1": 86.56, "r_x2": 499.56, "r_y2": 78.69, "r_x3": 65.68, "r_y3": 78.69, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells" }, { "label": "table", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "table", "bbox": { "l": 53.63, "t": 218.95, "r": 298.56, "b": 292.4, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 55, "label": "text", "bbox": { "l": 209.93, "t": 222.18, "r": 241.04, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.93, "r_y0": 226.36, "r_x1": 241.04, "r_y1": 226.36, "r_x2": 241.04, "r_y2": 222.18, "r_x3": 209.93, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 263.76, "t": 222.18, "r": 284.51, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.76, "r_y0": 226.36, "r_x1": 284.51, "r_y1": 226.36, "r_x2": 284.51, "r_y2": 222.18, "r_x3": 263.76, "r_y3": 222.18, "coord_origin": "TOPLEFT" }, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 110.25, "t": 229.67, "r": 120.62, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.25, "r_y0": 233.85, "r_x1": 120.62, "r_y1": 233.85, "r_x2": 120.62, "r_y2": 229.67, "r_x3": 110.25, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 175.37, "t": 229.67, "r": 196.11, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 175.37, "r_y0": 233.85, "r_x1": 196.11, "r_y1": 233.85, "r_x2": 196.11, "r_y2": 229.67, "r_x3": 175.37, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u30d5\u30a1\u30a4\u30eb", "orig": "\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 196.11, "t": 229.67, "r": 201.29, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.11, "r_y0": 233.85, "r_x1": 201.29, "r_y1": 233.85, "r_x2": 201.29, "r_y2": 229.67, "r_x3": 196.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u6570", "orig": "\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 209.62, "t": 229.67, "r": 219.99, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.62, "r_y0": 233.85, "r_x1": 219.99, "r_y1": 233.85, "r_x2": 219.99, "r_y2": 229.67, "r_x3": 209.62, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 229.2, "t": 229.67, "r": 244.75, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.2, "r_y0": 233.85, "r_x1": 244.75, "r_y1": 233.85, "r_x2": 244.75, "r_y2": 229.67, "r_x3": 229.2, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 256.11, "t": 229.67, "r": 266.48, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.11, "r_y0": 233.85, "r_x1": 266.48, "r_y1": 233.85, "r_x2": 266.48, "r_y2": 229.67, "r_x3": 256.11, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 278.38, "t": 229.67, "r": 293.94, "b": 233.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.38, "r_y0": 233.85, "r_x1": 293.94, "r_y1": 233.85, "r_x2": 293.94, "r_y2": 229.67, "r_x3": 278.38, "r_y3": 229.67, "coord_origin": "TOPLEFT" }, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 55.53, "t": 236.43, "r": 162.71, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 240.78, "r_x1": 162.71, "r_y1": 240.78, "r_x2": 162.71, "r_y2": 236.43, "r_x3": 55.53, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 184.4, "t": 236.43, "r": 189.56, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 240.78, "r_x1": 189.56, "r_y1": 240.78, "r_x2": 189.56, "r_y2": 236.43, "r_x3": 184.4, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 208.99, "t": 236.43, "r": 214.16, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 240.78, "r_x1": 214.16, "r_y1": 240.78, "r_x2": 214.16, "r_y2": 236.43, "r_x3": 208.99, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 234.88, "t": 236.43, "r": 237.46, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 240.78, "r_x1": 237.46, "r_y1": 240.78, "r_x2": 237.46, "r_y2": 236.43, "r_x3": 234.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 256.88, "t": 236.43, "r": 264.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 240.78, "r_x1": 264.64, "r_y1": 240.78, "r_x2": 264.64, "r_y2": 236.43, "r_x3": 256.88, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 284.06, "t": 236.43, "r": 286.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 240.78, "r_x1": 286.64, "r_y1": 240.78, "r_x2": 286.64, "r_y2": 236.43, "r_x3": 284.06, "r_y3": 236.43, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 55.53, "t": 242.62, "r": 139.72, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 246.98, "r_x1": 139.72, "r_y1": 246.98, "r_x2": 139.72, "r_y2": 242.62, "r_x3": 55.53, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 183.11, "t": 242.62, "r": 190.86, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 246.98, "r_x1": 190.86, "r_y1": 246.98, "r_x2": 190.86, "r_y2": 242.62, "r_x3": 183.11, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 207.7, "t": 242.62, "r": 215.45, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 246.98, "r_x1": 215.45, "r_y1": 246.98, "r_x2": 215.45, "r_y2": 242.62, "r_x3": 207.7, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 234.88, "t": 242.62, "r": 237.46, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.88, "r_y0": 246.98, "r_x1": 237.46, "r_y1": 246.98, "r_x2": 237.46, "r_y2": 242.62, "r_x3": 234.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 256.88, "t": 242.62, "r": 264.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 246.98, "r_x1": 264.64, "r_y1": 246.98, "r_x2": 264.64, "r_y2": 242.62, "r_x3": 256.88, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 284.06, "t": 242.62, "r": 286.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.06, "r_y0": 246.98, "r_x1": 286.64, "r_y1": 246.98, "r_x2": 286.64, "r_y2": 242.62, "r_x3": 284.06, "r_y3": 242.62, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 55.53, "t": 249.8, "r": 97.01, "b": 253.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 253.98, "r_x1": 97.01, "r_y1": 253.98, "r_x2": 97.01, "r_y2": 249.8, "r_x3": 55.53, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 92.7, "t": 249.59, "r": 103.03, "b": 253.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 92.7, "r_y0": 253.95, "r_x1": 103.03, "r_y1": 253.95, "r_x2": 103.03, "r_y2": 249.59, "r_x3": 92.7, "r_y3": 249.59, "coord_origin": "TOPLEFT" }, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 103.03, "t": 249.8, "r": 128.96, "b": 253.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.03, "r_y0": 253.98, "r_x1": 128.96, "r_y1": 253.98, "r_x2": 128.96, "r_y2": 249.8, "r_x3": 103.03, "r_y3": 249.8, "coord_origin": "TOPLEFT" }, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 183.11, "t": 248.82, "r": 190.86, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 253.17, "r_x1": 190.86, "r_y1": 253.17, "r_x2": 190.86, "r_y2": 248.82, "r_x3": 183.11, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 210.28, "t": 248.82, "r": 212.87, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 253.17, "r_x1": 212.87, "r_y1": 253.17, "r_x2": 212.87, "r_y2": 248.82, "r_x3": 210.28, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.29, "t": 248.82, "r": 240.04, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 253.17, "r_x1": 240.04, "r_y1": 253.17, "r_x2": 240.04, "r_y2": 248.82, "r_x3": 232.29, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 256.88, "t": 248.82, "r": 264.64, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 253.17, "r_x1": 264.64, "r_y1": 253.17, "r_x2": 264.64, "r_y2": 248.82, "r_x3": 256.88, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 281.48, "t": 248.82, "r": 289.23, "b": 253.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 253.17, "r_x1": 289.23, "r_y1": 253.17, "r_x2": 289.23, "r_y2": 248.82, "r_x3": 281.48, "r_y3": 248.82, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 55.53, "t": 257.28, "r": 91.83, "b": 261.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 261.47, "r_x1": 91.83, "r_y1": 261.47, "r_x2": 91.83, "r_y2": 257.28, "r_x3": 55.53, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 88.05, "t": 257.07, "r": 93.22, "b": 261.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 88.05, "r_y0": 261.43, "r_x1": 93.22, "r_y1": 261.43, "r_x2": 93.22, "r_y2": 257.07, "r_x3": 88.05, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 93.22, "t": 257.28, "r": 119.15, "b": 261.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.22, "r_y0": 261.47, "r_x1": 119.15, "r_y1": 261.47, "r_x2": 119.15, "r_y2": 257.28, "r_x3": 93.22, "r_y3": 257.28, "coord_origin": "TOPLEFT" }, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 116.45, "t": 257.07, "r": 129.88, "b": 261.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 261.43, "r_x1": 129.88, "r_y1": 261.43, "r_x2": 129.88, "r_y2": 257.07, "r_x3": 116.45, "r_y3": 257.07, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.11, "t": 256.3, "r": 190.86, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 260.66, "r_x1": 190.86, "r_y1": 260.66, "r_x2": 190.86, "r_y2": 256.3, "r_x3": 183.11, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 210.28, "t": 256.3, "r": 212.87, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 260.66, "r_x1": 212.87, "r_y1": 260.66, "r_x2": 212.87, "r_y2": 256.3, "r_x3": 210.28, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 232.29, "t": 256.3, "r": 240.04, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 260.66, "r_x1": 240.04, "r_y1": 260.66, "r_x2": 240.04, "r_y2": 256.3, "r_x3": 232.29, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 256.88, "t": 256.3, "r": 264.64, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 260.66, "r_x1": 264.64, "r_y1": 260.66, "r_x2": 264.64, "r_y2": 256.3, "r_x3": 256.88, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 281.48, "t": 256.3, "r": 289.23, "b": 260.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 260.66, "r_x1": 289.23, "r_y1": 260.66, "r_x2": 289.23, "r_y2": 256.3, "r_x3": 281.48, "r_y3": 256.3, "coord_origin": "TOPLEFT" }, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 55.53, "t": 264.51, "r": 60.72, "b": 268.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 268.69, "r_x1": 60.72, "r_y1": 268.69, "r_x2": 60.72, "r_y2": 264.51, "r_x3": 55.53, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 60.18, "t": 264.3, "r": 65.34, "b": 268.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.18, "r_y0": 268.66, "r_x1": 65.34, "r_y1": 268.66, "r_x2": 65.34, "r_y2": 264.3, "r_x3": 60.18, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 65.34, "t": 264.51, "r": 122.38, "b": 268.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 65.34, "r_y0": 268.69, "r_x1": 122.38, "r_y1": 268.69, "r_x2": 122.38, "r_y2": 264.51, "r_x3": 65.34, "r_y3": 264.51, "coord_origin": "TOPLEFT" }, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 116.45, "t": 264.3, "r": 129.88, "b": 268.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.45, "r_y0": 268.66, "r_x1": 129.88, "r_y1": 268.66, "r_x2": 129.88, "r_y2": 264.3, "r_x3": 116.45, "r_y3": 264.3, "coord_origin": "TOPLEFT" }, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 183.11, "t": 263.53, "r": 190.86, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 267.89, "r_x1": 190.86, "r_y1": 267.89, "r_x2": 190.86, "r_y2": 263.53, "r_x3": 183.11, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 210.28, "t": 263.53, "r": 212.87, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 267.89, "r_x1": 212.87, "r_y1": 267.89, "r_x2": 212.87, "r_y2": 263.53, "r_x3": 210.28, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 232.29, "t": 263.53, "r": 240.04, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 267.89, "r_x1": 240.04, "r_y1": 267.89, "r_x2": 240.04, "r_y2": 263.53, "r_x3": 232.29, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 256.88, "t": 263.53, "r": 264.64, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 267.89, "r_x1": 264.64, "r_y1": 267.89, "r_x2": 264.64, "r_y2": 263.53, "r_x3": 256.88, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 281.48, "t": 263.53, "r": 289.23, "b": 267.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 267.89, "r_x1": 289.23, "r_y1": 267.89, "r_x2": 289.23, "r_y2": 263.53, "r_x3": 281.48, "r_y3": 263.53, "coord_origin": "TOPLEFT" }, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 55.53, "t": 271.74, "r": 107.38, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 275.92, "r_x1": 107.38, "r_y1": 275.92, "r_x2": 107.38, "r_y2": 271.74, "r_x3": 55.53, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 101.99, "t": 271.53, "r": 109.74, "b": 275.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 101.99, "r_y0": 275.89, "r_x1": 109.74, "r_y1": 275.89, "r_x2": 109.74, "r_y2": 271.53, "r_x3": 101.99, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 109.74, "t": 271.74, "r": 114.93, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 109.74, "r_y0": 275.92, "r_x1": 114.93, "r_y1": 275.92, "r_x2": 114.93, "r_y2": 271.74, "r_x3": 109.74, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 114.39, "t": 271.53, "r": 122.14, "b": 275.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 114.39, "r_y0": 275.89, "r_x1": 122.14, "r_y1": 275.89, "r_x2": 122.14, "r_y2": 271.53, "r_x3": 114.39, "r_y3": 271.53, "coord_origin": "TOPLEFT" }, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 122.14, "t": 271.74, "r": 127.32, "b": 275.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.14, "r_y0": 275.92, "r_x1": 127.32, "r_y1": 275.92, "r_x2": 127.32, "r_y2": 271.74, "r_x3": 122.14, "r_y3": 271.74, "coord_origin": "TOPLEFT" }, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 184.4, "t": 270.75, "r": 189.56, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 184.4, "r_y0": 275.11, "r_x1": 189.56, "r_y1": 275.11, "r_x2": 189.56, "r_y2": 270.75, "r_x3": 184.4, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 210.28, "t": 270.75, "r": 212.87, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.28, "r_y0": 275.11, "r_x1": 212.87, "r_y1": 275.11, "r_x2": 212.87, "r_y2": 270.75, "r_x3": 210.28, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 233.58, "t": 270.75, "r": 238.75, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 275.11, "r_x1": 238.75, "r_y1": 275.11, "r_x2": 238.75, "r_y2": 270.75, "r_x3": 233.58, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 256.88, "t": 270.75, "r": 264.64, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 275.11, "r_x1": 264.64, "r_y1": 275.11, "r_x2": 264.64, "r_y2": 270.75, "r_x3": 256.88, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 281.48, "t": 270.75, "r": 289.23, "b": 275.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 275.11, "r_x1": 289.23, "r_y1": 275.11, "r_x2": 289.23, "r_y2": 270.75, "r_x3": 281.48, "r_y3": 270.75, "coord_origin": "TOPLEFT" }, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 55.53, "t": 279.01, "r": 68.69, "b": 283.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 55.53, "r_y0": 283.37, "r_x1": 68.69, "r_y1": 283.37, "r_x2": 68.69, "r_y2": 279.01, "r_x3": 55.53, "r_y3": 279.01, "coord_origin": "TOPLEFT" }, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 68.69, "t": 279.22, "r": 110.17, "b": 283.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.69, "r_y0": 283.4, "r_x1": 110.17, "r_y1": 283.4, "r_x2": 110.17, "r_y2": 279.22, "r_x3": 68.69, "r_y3": 279.22, "coord_origin": "TOPLEFT" }, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 183.11, "t": 277.98, "r": 190.86, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 282.34, "r_x1": 190.86, "r_y1": 282.34, "r_x2": 190.86, "r_y2": 277.98, "r_x3": 183.11, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 208.99, "t": 277.98, "r": 214.16, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.99, "r_y0": 282.34, "r_x1": 214.16, "r_y1": 282.34, "r_x2": 214.16, "r_y2": 277.98, "r_x3": 208.99, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 233.58, "t": 277.98, "r": 238.75, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.58, "r_y0": 282.34, "r_x1": 238.75, "r_y1": 282.34, "r_x2": 238.75, "r_y2": 277.98, "r_x3": 233.58, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 256.88, "t": 277.98, "r": 264.64, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 256.88, "r_y0": 282.34, "r_x1": 264.64, "r_y1": 282.34, "r_x2": 264.64, "r_y2": 277.98, "r_x3": 256.88, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 282.77, "t": 277.98, "r": 287.94, "b": 282.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.77, "r_y0": 282.34, "r_x1": 287.94, "r_y1": 282.34, "r_x2": 287.94, "r_y2": 277.98, "r_x3": 282.77, "r_y3": 277.98, "coord_origin": "TOPLEFT" }, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 169.62, "t": 286.45, "r": 174.8, "b": 290.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.62, "r_y0": 290.63, "r_x1": 174.8, "r_y1": 290.63, "r_x2": 174.8, "r_y2": 286.45, "r_x3": 169.62, "r_y3": 286.45, "coord_origin": "TOPLEFT" }, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 183.11, "t": 285.47, "r": 190.86, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.11, "r_y0": 289.82, "r_x1": 190.86, "r_y1": 289.82, "r_x2": 190.86, "r_y2": 285.47, "r_x3": 183.11, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 207.7, "t": 285.47, "r": 215.45, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.7, "r_y0": 289.82, "r_x1": 215.45, "r_y1": 289.82, "r_x2": 215.45, "r_y2": 285.47, "r_x3": 207.7, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 232.29, "t": 285.47, "r": 240.04, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.29, "r_y0": 289.82, "r_x1": 240.04, "r_y1": 289.82, "r_x2": 240.04, "r_y2": 285.47, "r_x3": 232.29, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 255.77, "t": 285.47, "r": 265.75, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.77, "r_y0": 289.82, "r_x1": 265.75, "r_y1": 289.82, "r_x2": 265.75, "r_y2": 285.47, "r_x3": 255.77, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 281.48, "t": 285.47, "r": 289.23, "b": 289.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 281.48, "r_y0": 289.82, "r_x1": 289.23, "r_y1": 289.82, "r_x2": 289.23, "r_y2": 285.47, "r_x3": 281.48, "r_y3": 285.47, "coord_origin": "TOPLEFT" }, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 10, "num_cols": 6, "table_cells": [ { "bbox": { "l": 209.93, "t": 222.18, "r": 241.04, "b": 226.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 263.76, "t": 222.18, "r": 284.51, "b": 226.36, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 110.25, "t": 229.67, "r": 120.62, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 175.37, "t": 229.67, "r": 196.11, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb \u6570", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 209.62, "t": 229.67, "r": 219.99, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 229.2, "t": 229.67, "r": 244.75, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 256.11, "t": 229.67, "r": 266.48, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 278.38, "t": 229.67, "r": 293.94, "b": 233.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 236.43, "r": 162.71, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.4, "t": 236.43, "r": 189.56, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99, "t": 236.43, "r": 214.16, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.88, "t": 236.43, "r": 237.46, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 236.43, "r": 264.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06, "t": 236.43, "r": 286.64, "b": 240.78, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 242.62, "r": 139.72, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 242.62, "r": 190.86, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.7, "t": 242.62, "r": 215.45, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 234.88, "t": 242.62, "r": 237.46, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 242.62, "r": 264.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 284.06, "t": 242.62, "r": 286.64, "b": 246.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 249.8, "r": 97.01, "b": 253.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 248.82, "r": 190.86, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 248.82, "r": 212.87, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 248.82, "r": 240.04, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 248.82, "r": 264.64, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 248.82, "r": 289.23, "b": 253.17, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 257.28, "r": 91.83, "b": 261.47, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 256.3, "r": 190.86, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 256.3, "r": 212.87, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 256.3, "r": 240.04, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 256.3, "r": 264.64, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 256.3, "r": 289.23, "b": 260.66, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 264.51, "r": 60.72, "b": 268.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 263.53, "r": 190.86, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 263.53, "r": 212.87, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 263.53, "r": 240.04, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 263.53, "r": 264.64, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 263.53, "r": 289.23, "b": 267.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 271.74, "r": 107.38, "b": 275.92, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 184.4, "t": 270.75, "r": 189.56, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 210.28, "t": 270.75, "r": 212.87, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58, "t": 270.75, "r": 238.75, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 270.75, "r": 264.64, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 270.75, "r": 289.23, "b": 275.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 55.53, "t": 279.01, "r": 68.69, "b": 283.37, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 277.98, "r": 190.86, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 208.99, "t": 277.98, "r": 214.16, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 233.58, "t": 277.98, "r": 238.75, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 256.88, "t": 277.98, "r": 264.64, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 282.77, "t": 277.98, "r": 287.94, "b": 282.34, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 169.62, "t": 286.45, "r": 174.8, "b": 290.63, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 183.11, "t": 285.47, "r": 190.86, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 207.7, "t": 285.47, "r": 215.45, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 232.29, "t": 285.47, "r": 240.04, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 255.77, "t": 285.47, "r": 265.75, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 281.48, "t": 285.47, "r": 289.23, "b": 289.82, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 16, "page_no": 7, "cluster": { "id": 16, "label": "caption", "bbox": { "l": 380.43, "t": 292.3, "r": 549.42, "b": 298.6, "coord_origin": "TOPLEFT" }, "confidence": 0.75, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.43, "r_y0": 298.6, "r_x1": 549.42, "r_y1": 298.6, "r_x2": 549.42, "r_y2": 292.3, "r_x3": 380.43, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Text is aligned to match original for ease of viewing" }, { "label": "table", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "table", "bbox": { "l": 304.92, "t": 218.51, "r": 550.23, "b": 287.9, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 125, "label": "text", "bbox": { "l": 459.05, "t": 221.62, "r": 542.0, "b": 226.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.05, "r_y0": 226.69, "r_x1": 542.0, "r_y1": 226.69, "r_x2": 542.0, "r_y2": 221.62, "r_x3": 459.05, "r_y3": 221.62, "coord_origin": "TOPLEFT" }, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 493.82, "t": 227.83, "r": 507.23, "b": 232.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 493.82, "r_y0": 232.9, "r_x1": 507.23, "r_y1": 232.9, "r_x2": 507.23, "r_y2": 227.83, "r_x3": 493.82, "r_y3": 227.83, "coord_origin": "TOPLEFT" }, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 393.24, "t": 236.75, "r": 400.75, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.24, "r_y0": 241.81, "r_x1": 400.75, "r_y1": 241.81, "r_x2": 400.75, "r_y2": 236.75, "r_x3": 393.24, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RS", "orig": "RS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 400.75, "t": 236.75, "r": 404.65, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 241.81, "r_x1": 404.65, "r_y1": 241.81, "r_x2": 404.65, "r_y2": 236.75, "r_x3": 400.75, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 404.65, "t": 236.75, "r": 407.35, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.65, "r_y0": 241.81, "r_x1": 407.35, "r_y1": 241.81, "r_x2": 407.35, "r_y2": 236.75, "r_x3": 404.65, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 392.1, "t": 221.57, "r": 438.01, "b": 226.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.1, "r_y0": 226.64, "r_x1": 438.01, "r_y1": 226.64, "r_x2": 438.01, "r_y2": 221.57, "r_x3": 392.1, "r_y3": 221.57, "coord_origin": "TOPLEFT" }, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 427.18, "t": 236.75, "r": 440.99, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.18, "r_y0": 241.81, "r_x1": 440.99, "r_y1": 241.81, "r_x2": 440.99, "r_y2": 236.75, "r_x3": 427.18, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 468.38, "t": 236.75, "r": 482.48, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.38, "r_y0": 241.81, "r_x1": 482.48, "r_y1": 241.81, "r_x2": 482.48, "r_y2": 236.75, "r_x3": 468.38, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 516.93, "t": 236.75, "r": 530.73, "b": 241.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.93, "r_y0": 241.81, "r_x1": 530.73, "r_y1": 241.81, "r_x2": 530.73, "r_y2": 236.75, "r_x3": 516.93, "r_y3": 236.75, "coord_origin": "TOPLEFT" }, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 306.11, "t": 244.61, "r": 355.65, "b": 249.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 249.68, "r_x1": 355.65, "r_y1": 249.68, "r_x2": 355.65, "r_y2": 244.61, "r_x3": 306.11, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "Nonvested on Janua", "orig": "Nonvested on Janua", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 355.65, "t": 244.61, "r": 364.66, "b": 249.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 355.65, "r_y0": 249.68, "r_x1": 364.66, "r_y1": 249.68, "r_x2": 364.66, "r_y2": 244.61, "r_x3": 355.65, "r_y3": 244.61, "coord_origin": "TOPLEFT" }, "text": "ry 1", "orig": "ry 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 396.25, "t": 244.91, "r": 400.75, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 249.98, "r_x1": 400.75, "r_y1": 249.98, "r_x2": 400.75, "r_y2": 244.91, "r_x3": 396.25, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 400.75, "t": 244.91, "r": 403.76, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 249.98, "r_x1": 403.76, "r_y1": 249.98, "r_x2": 403.76, "r_y2": 244.91, "r_x3": 400.75, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 429.82, "t": 244.91, "r": 437.33, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 249.98, "r_x1": 437.33, "r_y1": 249.98, "r_x2": 437.33, "r_y2": 244.91, "r_x3": 429.82, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 465.53, "t": 244.91, "r": 478.4, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.53, "r_y0": 249.98, "r_x1": 478.4, "r_y1": 249.98, "r_x2": 478.4, "r_y2": 244.91, "r_x3": 465.53, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "90.10", "orig": "90.10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 480.98, "t": 244.91, "r": 483.55, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 480.98, "r_y0": 249.98, "r_x1": 483.55, "r_y1": 249.98, "r_x2": 483.55, "r_y2": 244.91, "r_x3": 480.98, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$", "orig": "$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 513.45, "t": 244.91, "r": 531.47, "b": 249.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 513.45, "r_y0": 249.98, "r_x1": 531.47, "r_y1": 249.98, "r_x2": 531.47, "r_y2": 244.91, "r_x3": 513.45, "r_y3": 244.91, "coord_origin": "TOPLEFT" }, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 306.11, "t": 253.68, "r": 325.63, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 258.75, "r_x1": 325.63, "r_y1": 258.75, "r_x2": 325.63, "r_y2": 253.68, "r_x3": 306.11, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 396.25, "t": 253.68, "r": 400.75, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 258.75, "r_x1": 400.75, "r_y1": 258.75, "r_x2": 400.75, "r_y2": 253.68, "r_x3": 396.25, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.", "orig": "0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 400.75, "t": 253.68, "r": 403.76, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.75, "r_y0": 258.75, "r_x1": 403.76, "r_y1": 258.75, "r_x2": 403.76, "r_y2": 253.68, "r_x3": 400.75, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 429.82, "t": 253.68, "r": 437.33, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.82, "r_y0": 258.75, "r_x1": 437.33, "r_y1": 258.75, "r_x2": 437.33, "r_y2": 253.68, "r_x3": 429.82, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 466.44, "t": 253.68, "r": 482.55, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.44, "r_y0": 258.75, "r_x1": 482.55, "r_y1": 258.75, "r_x2": 482.55, "r_y2": 253.68, "r_x3": 466.44, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 514.29, "t": 253.68, "r": 530.81, "b": 258.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 514.29, "r_y0": 258.75, "r_x1": 530.81, "r_y1": 258.75, "r_x2": 530.81, "r_y2": 253.68, "r_x3": 514.29, "r_y3": 253.68, "coord_origin": "TOPLEFT" }, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 306.11, "t": 261.55, "r": 322.63, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 266.61, "r_x1": 322.63, "r_y1": 266.61, "r_x2": 322.63, "r_y2": 261.55, "r_x3": 306.11, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 394.43, "t": 261.55, "r": 400.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 266.61, "r_x1": 400.74, "r_y1": 266.61, "r_x2": 400.74, "r_y2": 261.55, "r_x3": 394.43, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 400.73, "t": 261.55, "r": 403.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 266.61, "r_x1": 403.74, "r_y1": 266.61, "r_x2": 403.74, "r_y2": 261.55, "r_x3": 400.73, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 403.74, "t": 261.55, "r": 405.54, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 266.61, "r_x1": 405.54, "r_y1": 266.61, "r_x2": 405.54, "r_y2": 261.55, "r_x3": 403.74, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 427.7, "t": 261.55, "r": 438.81, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.7, "r_y0": 266.61, "r_x1": 438.81, "r_y1": 266.61, "r_x2": 438.81, "r_y2": 261.55, "r_x3": 427.7, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 468.56, "t": 261.55, "r": 482.07, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 468.56, "r_y0": 266.61, "r_x1": 482.07, "r_y1": 266.61, "r_x2": 482.07, "r_y2": 261.55, "r_x3": 468.56, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 516.02, "t": 261.55, "r": 529.53, "b": 266.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 266.61, "r_x1": 529.53, "r_y1": 266.61, "r_x2": 529.53, "r_y2": 261.55, "r_x3": 516.02, "r_y3": 261.55, "coord_origin": "TOPLEFT" }, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 155, "label": "text", "bbox": { "l": 306.11, "t": 269.64, "r": 356.25, "b": 274.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 274.71, "r_x1": 356.25, "r_y1": 274.71, "r_x2": 356.25, "r_y2": 269.64, "r_x3": 306.11, "r_y3": 269.64, "coord_origin": "TOPLEFT" }, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 394.43, "t": 270.32, "r": 400.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.43, "r_y0": 275.38, "r_x1": 400.74, "r_y1": 275.38, "r_x2": 400.74, "r_y2": 270.32, "r_x3": 394.43, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "(0.", "orig": "(0.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 157, "label": "text", "bbox": { "l": 400.73, "t": 270.32, "r": 403.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.73, "r_y0": 275.38, "r_x1": 403.74, "r_y1": 275.38, "r_x2": 403.74, "r_y2": 270.32, "r_x3": 400.73, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 158, "label": "text", "bbox": { "l": 403.74, "t": 270.32, "r": 405.54, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.74, "r_y0": 275.38, "r_x1": 405.54, "r_y1": 275.38, "r_x2": 405.54, "r_y2": 270.32, "r_x3": 403.74, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 159, "label": "text", "bbox": { "l": 431.03, "t": 270.32, "r": 436.43, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.03, "r_y0": 275.38, "r_x1": 436.43, "r_y1": 275.38, "r_x2": 436.43, "r_y2": 270.32, "r_x3": 431.03, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 160, "label": "text", "bbox": { "l": 465.83, "t": 270.32, "r": 482.35, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.83, "r_y0": 275.38, "r_x1": 482.35, "r_y1": 275.38, "r_x2": 482.35, "r_y2": 270.32, "r_x3": 465.83, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 161, "label": "text", "bbox": { "l": 516.02, "t": 270.32, "r": 529.53, "b": 275.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 516.02, "r_y0": 275.38, "r_x1": 529.53, "r_y1": 275.38, "r_x2": 529.53, "r_y2": 270.32, "r_x3": 516.02, "r_y3": 270.32, "coord_origin": "TOPLEFT" }, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 162, "label": "text", "bbox": { "l": 306.11, "t": 278.49, "r": 373.36, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.11, "r_y0": 283.55, "r_x1": 373.36, "r_y1": 283.55, "r_x2": 373.36, "r_y2": 278.49, "r_x3": 306.11, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 163, "label": "text", "bbox": { "l": 396.25, "t": 278.49, "r": 403.76, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.25, "r_y0": 283.55, "r_x1": 403.76, "r_y1": 283.55, "r_x2": 403.76, "r_y2": 278.49, "r_x3": 396.25, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 164, "label": "text", "bbox": { "l": 429.52, "t": 278.49, "r": 437.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.52, "r_y0": 283.55, "r_x1": 437.02, "r_y1": 283.55, "r_x2": 437.02, "r_y2": 278.49, "r_x3": 429.52, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 165, "label": "text", "bbox": { "l": 463.71, "t": 278.49, "r": 484.74, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.71, "r_y0": 283.55, "r_x1": 484.74, "r_y1": 283.55, "r_x2": 484.74, "r_y2": 278.49, "r_x3": 463.71, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 166, "label": "text", "bbox": { "l": 512.99, "t": 278.49, "r": 534.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 512.99, "r_y0": 283.55, "r_x1": 534.02, "r_y1": 283.55, "r_x2": 534.02, "r_y2": 278.49, "r_x3": 512.99, "r_y3": 278.49, "coord_origin": "TOPLEFT" }, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 7, "num_cols": 5, "table_cells": [ { "bbox": { "l": 459.05, "t": 221.62, "r": 542.0, "b": 226.69, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 393.24, "t": 236.75, "r": 400.75, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RS U s", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 392.1, "t": 221.57, "r": 438.01, "b": 226.64, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.18, "t": 236.75, "r": 440.99, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 468.38, "t": 236.75, "r": 482.48, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 516.93, "t": 236.75, "r": 530.73, "b": 241.81, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 244.61, "r": 355.65, "b": 249.68, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on Janua ry 1", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 244.91, "r": 400.75, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1. 1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.82, "t": 244.91, "r": 437.33, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.53, "t": 244.91, "r": 478.4, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 513.45, "t": 244.91, "r": 531.47, "b": 249.98, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 253.68, "r": 325.63, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 253.68, "r": 400.75, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0. 5", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.82, "t": 253.68, "r": 437.33, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 466.44, "t": 253.68, "r": 482.55, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 514.29, "t": 253.68, "r": 530.81, "b": 258.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 261.55, "r": 322.63, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43, "t": 261.55, "r": 400.74, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 5 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 427.7, "t": 261.55, "r": 438.81, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 468.56, "t": 261.55, "r": 482.07, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.02, "t": 261.55, "r": 529.53, "b": 266.61, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 269.64, "r": 356.25, "b": 274.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 394.43, "t": 270.32, "r": 400.74, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0. 1 )", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 431.03, "t": 270.32, "r": 436.43, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 465.83, "t": 270.32, "r": 482.35, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 516.02, "t": 270.32, "r": 529.53, "b": 275.38, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 306.11, "t": 278.49, "r": 373.36, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false }, { "bbox": { "l": 396.25, "t": 278.49, "r": 403.76, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 429.52, "t": 278.49, "r": 437.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 463.71, "t": 278.49, "r": 484.74, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 512.99, "t": 278.49, "r": 534.02, "b": 283.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "caption", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 50.11, "t": 320.88, "r": 545.11, "b": 365.65, "coord_origin": "TOPLEFT" }, "confidence": 0.914, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 329.78, "r_x1": 86.86, "r_y1": 329.78, "r_x2": 86.86, "r_y2": 320.88, "r_x3": 50.11, "r_y3": 320.88, "coord_origin": "TOPLEFT" }, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 93.92, "r_y0": 329.78, "r_x1": 545.11, "r_y1": 329.78, "r_x2": 545.11, "r_y2": 320.88, "r_x3": 93.92, "r_y3": 320.88, "coord_origin": "TOPLEFT" }, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 341.74, "r_x1": 545.11, "r_y1": 341.74, "r_x2": 545.11, "r_y2": 332.83, "r_x3": 50.11, "r_y3": 332.83, "coord_origin": "TOPLEFT" }, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 353.69, "r_x1": 545.11, "r_y1": 353.69, "r_x2": 545.11, "r_y2": 344.79, "r_x3": 50.11, "r_y3": 344.79, "coord_origin": "TOPLEFT" }, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 365.65, "r_x1": 139.8, "r_y1": 365.65, "r_x2": 139.8, "r_y2": 356.74, "r_x3": 50.11, "r_y3": 356.74, "coord_origin": "TOPLEFT" }, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset." }, { "label": "picture", "id": 12, "page_no": 7, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 216.77, "t": 380.49, "r": 375.78, "b": 443.35, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26, "r_y0": 386.44, "r_x1": 342.08, "r_y1": 386.44, "r_x2": 342.08, "r_y2": 381.78, "r_x3": 220.26, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 167, "label": "text", "bbox": { "l": 220.26, "t": 381.78, "r": 342.08, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.26, "r_y0": 386.44, "r_x1": 342.08, "r_y1": 386.44, "r_x2": 342.08, "r_y2": 381.78, "r_x3": 220.26, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 11, "page_no": 7, "cluster": { "id": 11, "label": "picture", "bbox": { "l": 51.74, "t": 380.48, "r": 211.84, "b": 443.66, "coord_origin": "TOPLEFT" }, "confidence": 0.831, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.72, "r_y0": 386.44, "r_x1": 85.66, "r_y1": 386.44, "r_x2": 85.66, "r_y2": 381.78, "r_x3": 53.72, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 168, "label": "text", "bbox": { "l": 53.72, "t": 381.78, "r": 85.66, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.72, "r_y0": 386.44, "r_x1": 85.66, "r_y1": 386.44, "r_x2": 85.66, "r_y2": 381.78, "r_x3": 53.72, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 13, "page_no": 7, "cluster": { "id": 13, "label": "picture", "bbox": { "l": 383.14, "t": 381.23, "r": 542.11, "b": 442.77, "coord_origin": "TOPLEFT" }, "confidence": 0.788, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 406.87, "r_x1": 443.7, "r_y1": 406.87, "r_x2": 443.7, "r_y2": 400.55, "r_x3": 437.38, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 406.87, "r_x1": 456.65, "r_y1": 406.87, "r_x2": 456.65, "r_y2": 400.55, "r_x3": 450.33, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 406.87, "r_x1": 469.6, "r_y1": 406.87, "r_x2": 469.6, "r_y2": 400.55, "r_x3": 463.28, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 406.87, "r_x1": 482.56, "r_y1": 406.87, "r_x2": 482.56, "r_y2": 400.55, "r_x3": 476.24, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 406.87, "r_x1": 495.51, "r_y1": 406.87, "r_x2": 495.51, "r_y2": 400.55, "r_x3": 489.19, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 406.87, "r_x1": 508.46, "r_y1": 406.87, "r_x2": 508.46, "r_y2": 400.55, "r_x3": 502.14, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 406.87, "r_x1": 521.41, "r_y1": 406.87, "r_x2": 521.41, "r_y2": 400.55, "r_x3": 515.1, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 417.36, "r_x1": 391.6, "r_y1": 417.36, "r_x2": 391.6, "r_y2": 411.04, "r_x3": 385.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 417.36, "r_x1": 404.84, "r_y1": 417.36, "r_x2": 404.84, "r_y2": 411.04, "r_x3": 398.52, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 417.36, "r_x1": 417.8, "r_y1": 417.36, "r_x2": 417.8, "r_y2": 411.04, "r_x3": 411.48, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 417.36, "r_x1": 443.7, "r_y1": 417.36, "r_x2": 443.7, "r_y2": 411.04, "r_x3": 437.38, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 417.36, "r_x1": 456.65, "r_y1": 417.36, "r_x2": 456.65, "r_y2": 411.04, "r_x3": 450.33, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 417.36, "r_x1": 469.6, "r_y1": 417.36, "r_x2": 469.6, "r_y2": 411.04, "r_x3": 463.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 427.39, "r_x1": 391.6, "r_y1": 427.39, "r_x2": 391.6, "r_y2": 421.07, "r_x3": 385.28, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 427.39, "r_x1": 404.84, "r_y1": 427.39, "r_x2": 404.84, "r_y2": 421.07, "r_x3": 398.52, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 427.39, "r_x1": 417.8, "r_y1": 427.39, "r_x2": 417.8, "r_y2": 421.07, "r_x3": 411.48, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 427.39, "r_x1": 430.75, "r_y1": 427.39, "r_x2": 430.75, "r_y2": 421.07, "r_x3": 424.43, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 427.39, "r_x1": 443.7, "r_y1": 427.39, "r_x2": 443.7, "r_y2": 421.07, "r_x3": 437.38, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 427.39, "r_x1": 456.65, "r_y1": 427.39, "r_x2": 456.65, "r_y2": 421.07, "r_x3": 450.33, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 427.39, "r_x1": 469.61, "r_y1": 427.39, "r_x2": 469.61, "r_y2": 421.07, "r_x3": 463.29, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 427.39, "r_x1": 482.56, "r_y1": 427.39, "r_x2": 482.56, "r_y2": 421.07, "r_x3": 476.24, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 427.39, "r_x1": 495.51, "r_y1": 427.39, "r_x2": 495.51, "r_y2": 421.07, "r_x3": 489.19, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 427.39, "r_x1": 508.46, "r_y1": 427.39, "r_x2": 508.46, "r_y2": 421.07, "r_x3": 502.14, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 427.39, "r_x1": 521.42, "r_y1": 427.39, "r_x2": 521.42, "r_y2": 421.07, "r_x3": 515.1, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 427.39, "r_x1": 534.37, "r_y1": 427.39, "r_x2": 534.37, "r_y2": 421.07, "r_x3": 528.05, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 438.36, "r_x1": 391.6, "r_y1": 438.36, "r_x2": 391.6, "r_y2": 432.04, "r_x3": 385.28, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 438.36, "r_x1": 404.84, "r_y1": 438.36, "r_x2": 404.84, "r_y2": 432.04, "r_x3": 398.52, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 438.36, "r_x1": 417.8, "r_y1": 438.36, "r_x2": 417.8, "r_y2": 432.04, "r_x3": 411.48, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 438.36, "r_x1": 430.75, "r_y1": 438.36, "r_x2": 430.75, "r_y2": 432.04, "r_x3": 424.43, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 438.36, "r_x1": 443.7, "r_y1": 438.36, "r_x2": 443.7, "r_y2": 432.04, "r_x3": 437.38, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 438.36, "r_x1": 456.65, "r_y1": 438.36, "r_x2": 456.65, "r_y2": 432.04, "r_x3": 450.33, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 438.36, "r_x1": 469.61, "r_y1": 438.36, "r_x2": 469.61, "r_y2": 432.04, "r_x3": 463.29, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 438.36, "r_x1": 482.56, "r_y1": 438.36, "r_x2": 482.56, "r_y2": 432.04, "r_x3": 476.24, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 438.36, "r_x1": 495.51, "r_y1": 438.36, "r_x2": 495.51, "r_y2": 432.04, "r_x3": 489.19, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 438.36, "r_x1": 508.46, "r_y1": 438.36, "r_x2": 508.46, "r_y2": 432.04, "r_x3": 502.14, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 438.36, "r_x1": 521.42, "r_y1": 438.36, "r_x2": 521.42, "r_y2": 432.04, "r_x3": 515.1, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 438.36, "r_x1": 534.37, "r_y1": 438.36, "r_x2": 534.37, "r_y2": 432.04, "r_x3": 528.05, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 395.52, "r_x1": 388.44, "r_y1": 395.52, "r_x2": 388.44, "r_y2": 389.2, "r_x3": 385.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 395.52, "r_x1": 401.68, "r_y1": 395.52, "r_x2": 401.68, "r_y2": 389.2, "r_x3": 398.52, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 395.52, "r_x1": 414.63, "r_y1": 395.52, "r_x2": 414.63, "r_y2": 389.2, "r_x3": 411.48, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 395.52, "r_x1": 427.59, "r_y1": 395.52, "r_x2": 427.59, "r_y2": 389.2, "r_x3": 424.43, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 395.52, "r_x1": 440.54, "r_y1": 395.52, "r_x2": 440.54, "r_y2": 389.2, "r_x3": 437.38, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 395.52, "r_x1": 453.49, "r_y1": 395.52, "r_x2": 453.49, "r_y2": 389.2, "r_x3": 450.33, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 395.52, "r_x1": 466.44, "r_y1": 395.52, "r_x2": 466.44, "r_y2": 389.2, "r_x3": 463.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 395.52, "r_x1": 479.39, "r_y1": 395.52, "r_x2": 479.39, "r_y2": 389.2, "r_x3": 476.24, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 395.52, "r_x1": 492.35, "r_y1": 395.52, "r_x2": 492.35, "r_y2": 389.2, "r_x3": 489.19, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 395.52, "r_x1": 505.3, "r_y1": 395.52, "r_x2": 505.3, "r_y2": 389.2, "r_x3": 502.14, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09, "r_y0": 395.52, "r_x1": 521.41, "r_y1": 395.52, "r_x2": 521.41, "r_y2": 389.2, "r_x3": 515.09, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04, "r_y0": 395.52, "r_x1": 534.13, "r_y1": 395.52, "r_x2": 534.13, "r_y2": 389.2, "r_x3": 528.04, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 405.29, "r_x1": 391.6, "r_y1": 405.29, "r_x2": 391.6, "r_y2": 398.97, "r_x3": 385.28, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 405.29, "r_x1": 404.84, "r_y1": 405.29, "r_x2": 404.84, "r_y2": 398.97, "r_x3": 398.52, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 405.29, "r_x1": 417.8, "r_y1": 405.29, "r_x2": 417.8, "r_y2": 398.97, "r_x3": 411.48, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 413.09, "r_x1": 430.75, "r_y1": 413.09, "r_x2": 430.75, "r_y2": 406.77, "r_x3": 424.43, "r_y3": 406.77, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.87, "r_y0": 417.31, "r_x1": 509.19, "r_y1": 417.31, "r_x2": 509.19, "r_y2": 410.99, "r_x3": 502.87, "r_y3": 410.99, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35, "r_y0": 386.44, "r_x1": 430.99, "r_y1": 386.44, "r_x2": 430.99, "r_y2": 381.78, "r_x3": 384.35, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 169, "label": "text", "bbox": { "l": 437.38, "t": 400.55, "r": 443.7, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 406.87, "r_x1": 443.7, "r_y1": 406.87, "r_x2": 443.7, "r_y2": 400.55, "r_x3": 437.38, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 170, "label": "text", "bbox": { "l": 450.33, "t": 400.55, "r": 456.65, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 406.87, "r_x1": 456.65, "r_y1": 406.87, "r_x2": 456.65, "r_y2": 400.55, "r_x3": 450.33, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 171, "label": "text", "bbox": { "l": 463.28, "t": 400.55, "r": 469.6, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 406.87, "r_x1": 469.6, "r_y1": 406.87, "r_x2": 469.6, "r_y2": 400.55, "r_x3": 463.28, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 172, "label": "text", "bbox": { "l": 476.24, "t": 400.55, "r": 482.56, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 406.87, "r_x1": 482.56, "r_y1": 406.87, "r_x2": 482.56, "r_y2": 400.55, "r_x3": 476.24, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 173, "label": "text", "bbox": { "l": 489.19, "t": 400.55, "r": 495.51, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 406.87, "r_x1": 495.51, "r_y1": 406.87, "r_x2": 495.51, "r_y2": 400.55, "r_x3": 489.19, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 174, "label": "text", "bbox": { "l": 502.14, "t": 400.55, "r": 508.46, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 406.87, "r_x1": 508.46, "r_y1": 406.87, "r_x2": 508.46, "r_y2": 400.55, "r_x3": 502.14, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 175, "label": "text", "bbox": { "l": 515.1, "t": 400.55, "r": 521.41, "b": 406.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 406.87, "r_x1": 521.41, "r_y1": 406.87, "r_x2": 521.41, "r_y2": 400.55, "r_x3": 515.1, "r_y3": 400.55, "coord_origin": "TOPLEFT" }, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 176, "label": "text", "bbox": { "l": 385.28, "t": 411.04, "r": 391.6, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 417.36, "r_x1": 391.6, "r_y1": 417.36, "r_x2": 391.6, "r_y2": 411.04, "r_x3": 385.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 177, "label": "text", "bbox": { "l": 398.52, "t": 411.04, "r": 404.84, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 417.36, "r_x1": 404.84, "r_y1": 417.36, "r_x2": 404.84, "r_y2": 411.04, "r_x3": 398.52, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 178, "label": "text", "bbox": { "l": 411.48, "t": 411.04, "r": 417.8, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 417.36, "r_x1": 417.8, "r_y1": 417.36, "r_x2": 417.8, "r_y2": 411.04, "r_x3": 411.48, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 179, "label": "text", "bbox": { "l": 437.38, "t": 411.04, "r": 443.7, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 417.36, "r_x1": 443.7, "r_y1": 417.36, "r_x2": 443.7, "r_y2": 411.04, "r_x3": 437.38, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 180, "label": "text", "bbox": { "l": 450.33, "t": 411.04, "r": 456.65, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 417.36, "r_x1": 456.65, "r_y1": 417.36, "r_x2": 456.65, "r_y2": 411.04, "r_x3": 450.33, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 181, "label": "text", "bbox": { "l": 463.28, "t": 411.04, "r": 469.6, "b": 417.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 417.36, "r_x1": 469.6, "r_y1": 417.36, "r_x2": 469.6, "r_y2": 411.04, "r_x3": 463.28, "r_y3": 411.04, "coord_origin": "TOPLEFT" }, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 182, "label": "text", "bbox": { "l": 385.28, "t": 421.07, "r": 391.6, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 427.39, "r_x1": 391.6, "r_y1": 427.39, "r_x2": 391.6, "r_y2": 421.07, "r_x3": 385.28, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 183, "label": "text", "bbox": { "l": 398.52, "t": 421.07, "r": 404.84, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 427.39, "r_x1": 404.84, "r_y1": 427.39, "r_x2": 404.84, "r_y2": 421.07, "r_x3": 398.52, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 184, "label": "text", "bbox": { "l": 411.48, "t": 421.07, "r": 417.8, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 427.39, "r_x1": 417.8, "r_y1": 427.39, "r_x2": 417.8, "r_y2": 421.07, "r_x3": 411.48, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 185, "label": "text", "bbox": { "l": 424.43, "t": 421.07, "r": 430.75, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 427.39, "r_x1": 430.75, "r_y1": 427.39, "r_x2": 430.75, "r_y2": 421.07, "r_x3": 424.43, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 186, "label": "text", "bbox": { "l": 437.38, "t": 421.07, "r": 443.7, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 427.39, "r_x1": 443.7, "r_y1": 427.39, "r_x2": 443.7, "r_y2": 421.07, "r_x3": 437.38, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 187, "label": "text", "bbox": { "l": 450.33, "t": 421.07, "r": 456.65, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 427.39, "r_x1": 456.65, "r_y1": 427.39, "r_x2": 456.65, "r_y2": 421.07, "r_x3": 450.33, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 188, "label": "text", "bbox": { "l": 463.29, "t": 421.07, "r": 469.61, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 427.39, "r_x1": 469.61, "r_y1": 427.39, "r_x2": 469.61, "r_y2": 421.07, "r_x3": 463.29, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 189, "label": "text", "bbox": { "l": 476.24, "t": 421.07, "r": 482.56, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 427.39, "r_x1": 482.56, "r_y1": 427.39, "r_x2": 482.56, "r_y2": 421.07, "r_x3": 476.24, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 190, "label": "text", "bbox": { "l": 489.19, "t": 421.07, "r": 495.51, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 427.39, "r_x1": 495.51, "r_y1": 427.39, "r_x2": 495.51, "r_y2": 421.07, "r_x3": 489.19, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 191, "label": "text", "bbox": { "l": 502.14, "t": 421.07, "r": 508.46, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 427.39, "r_x1": 508.46, "r_y1": 427.39, "r_x2": 508.46, "r_y2": 421.07, "r_x3": 502.14, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 192, "label": "text", "bbox": { "l": 515.1, "t": 421.07, "r": 521.42, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 427.39, "r_x1": 521.42, "r_y1": 427.39, "r_x2": 521.42, "r_y2": 421.07, "r_x3": 515.1, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 193, "label": "text", "bbox": { "l": 528.05, "t": 421.07, "r": 534.37, "b": 427.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 427.39, "r_x1": 534.37, "r_y1": 427.39, "r_x2": 534.37, "r_y2": 421.07, "r_x3": 528.05, "r_y3": 421.07, "coord_origin": "TOPLEFT" }, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 194, "label": "text", "bbox": { "l": 385.28, "t": 432.04, "r": 391.6, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 438.36, "r_x1": 391.6, "r_y1": 438.36, "r_x2": 391.6, "r_y2": 432.04, "r_x3": 385.28, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 195, "label": "text", "bbox": { "l": 398.52, "t": 432.04, "r": 404.84, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 438.36, "r_x1": 404.84, "r_y1": 438.36, "r_x2": 404.84, "r_y2": 432.04, "r_x3": 398.52, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 196, "label": "text", "bbox": { "l": 411.48, "t": 432.04, "r": 417.8, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 438.36, "r_x1": 417.8, "r_y1": 438.36, "r_x2": 417.8, "r_y2": 432.04, "r_x3": 411.48, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 197, "label": "text", "bbox": { "l": 424.43, "t": 432.04, "r": 430.75, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 438.36, "r_x1": 430.75, "r_y1": 438.36, "r_x2": 430.75, "r_y2": 432.04, "r_x3": 424.43, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 198, "label": "text", "bbox": { "l": 437.38, "t": 432.04, "r": 443.7, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 438.36, "r_x1": 443.7, "r_y1": 438.36, "r_x2": 443.7, "r_y2": 432.04, "r_x3": 437.38, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 199, "label": "text", "bbox": { "l": 450.33, "t": 432.04, "r": 456.65, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 438.36, "r_x1": 456.65, "r_y1": 438.36, "r_x2": 456.65, "r_y2": 432.04, "r_x3": 450.33, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 200, "label": "text", "bbox": { "l": 463.29, "t": 432.04, "r": 469.61, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.29, "r_y0": 438.36, "r_x1": 469.61, "r_y1": 438.36, "r_x2": 469.61, "r_y2": 432.04, "r_x3": 463.29, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 201, "label": "text", "bbox": { "l": 476.24, "t": 432.04, "r": 482.56, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 438.36, "r_x1": 482.56, "r_y1": 438.36, "r_x2": 482.56, "r_y2": 432.04, "r_x3": 476.24, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 202, "label": "text", "bbox": { "l": 489.19, "t": 432.04, "r": 495.51, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 438.36, "r_x1": 495.51, "r_y1": 438.36, "r_x2": 495.51, "r_y2": 432.04, "r_x3": 489.19, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 203, "label": "text", "bbox": { "l": 502.14, "t": 432.04, "r": 508.46, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 438.36, "r_x1": 508.46, "r_y1": 438.36, "r_x2": 508.46, "r_y2": 432.04, "r_x3": 502.14, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 204, "label": "text", "bbox": { "l": 515.1, "t": 432.04, "r": 521.42, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.1, "r_y0": 438.36, "r_x1": 521.42, "r_y1": 438.36, "r_x2": 521.42, "r_y2": 432.04, "r_x3": 515.1, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 205, "label": "text", "bbox": { "l": 528.05, "t": 432.04, "r": 534.37, "b": 438.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.05, "r_y0": 438.36, "r_x1": 534.37, "r_y1": 438.36, "r_x2": 534.37, "r_y2": 432.04, "r_x3": 528.05, "r_y3": 432.04, "coord_origin": "TOPLEFT" }, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 206, "label": "text", "bbox": { "l": 385.28, "t": 389.2, "r": 388.44, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 395.52, "r_x1": 388.44, "r_y1": 395.52, "r_x2": 388.44, "r_y2": 389.2, "r_x3": 385.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 207, "label": "text", "bbox": { "l": 398.52, "t": 389.2, "r": 401.68, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 395.52, "r_x1": 401.68, "r_y1": 395.52, "r_x2": 401.68, "r_y2": 389.2, "r_x3": 398.52, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 208, "label": "text", "bbox": { "l": 411.48, "t": 389.2, "r": 414.63, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 395.52, "r_x1": 414.63, "r_y1": 395.52, "r_x2": 414.63, "r_y2": 389.2, "r_x3": 411.48, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 209, "label": "text", "bbox": { "l": 424.43, "t": 389.2, "r": 427.59, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 395.52, "r_x1": 427.59, "r_y1": 395.52, "r_x2": 427.59, "r_y2": 389.2, "r_x3": 424.43, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 210, "label": "text", "bbox": { "l": 437.38, "t": 389.2, "r": 440.54, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.38, "r_y0": 395.52, "r_x1": 440.54, "r_y1": 395.52, "r_x2": 440.54, "r_y2": 389.2, "r_x3": 437.38, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 211, "label": "text", "bbox": { "l": 450.33, "t": 389.2, "r": 453.49, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 450.33, "r_y0": 395.52, "r_x1": 453.49, "r_y1": 395.52, "r_x2": 453.49, "r_y2": 389.2, "r_x3": 450.33, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 212, "label": "text", "bbox": { "l": 463.28, "t": 389.2, "r": 466.44, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 463.28, "r_y0": 395.52, "r_x1": 466.44, "r_y1": 395.52, "r_x2": 466.44, "r_y2": 389.2, "r_x3": 463.28, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 213, "label": "text", "bbox": { "l": 476.24, "t": 389.2, "r": 479.39, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.24, "r_y0": 395.52, "r_x1": 479.39, "r_y1": 395.52, "r_x2": 479.39, "r_y2": 389.2, "r_x3": 476.24, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 214, "label": "text", "bbox": { "l": 489.19, "t": 389.2, "r": 492.35, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.19, "r_y0": 395.52, "r_x1": 492.35, "r_y1": 395.52, "r_x2": 492.35, "r_y2": 389.2, "r_x3": 489.19, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 215, "label": "text", "bbox": { "l": 502.14, "t": 389.2, "r": 505.3, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.14, "r_y0": 395.52, "r_x1": 505.3, "r_y1": 395.52, "r_x2": 505.3, "r_y2": 389.2, "r_x3": 502.14, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 216, "label": "text", "bbox": { "l": 515.09, "t": 389.2, "r": 521.41, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 515.09, "r_y0": 395.52, "r_x1": 521.41, "r_y1": 395.52, "r_x2": 521.41, "r_y2": 389.2, "r_x3": 515.09, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 217, "label": "text", "bbox": { "l": 528.04, "t": 389.2, "r": 534.13, "b": 395.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 528.04, "r_y0": 395.52, "r_x1": 534.13, "r_y1": 395.52, "r_x2": 534.13, "r_y2": 389.2, "r_x3": 528.04, "r_y3": 389.2, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 218, "label": "text", "bbox": { "l": 385.28, "t": 398.97, "r": 391.6, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.28, "r_y0": 405.29, "r_x1": 391.6, "r_y1": 405.29, "r_x2": 391.6, "r_y2": 398.97, "r_x3": 385.28, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 219, "label": "text", "bbox": { "l": 398.52, "t": 398.97, "r": 404.84, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.52, "r_y0": 405.29, "r_x1": 404.84, "r_y1": 405.29, "r_x2": 404.84, "r_y2": 398.97, "r_x3": 398.52, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 220, "label": "text", "bbox": { "l": 411.48, "t": 398.97, "r": 417.8, "b": 405.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.48, "r_y0": 405.29, "r_x1": 417.8, "r_y1": 405.29, "r_x2": 417.8, "r_y2": 398.97, "r_x3": 411.48, "r_y3": 398.97, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 221, "label": "text", "bbox": { "l": 424.43, "t": 406.77, "r": 430.75, "b": 413.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.43, "r_y0": 413.09, "r_x1": 430.75, "r_y1": 413.09, "r_x2": 430.75, "r_y2": 406.77, "r_x3": 424.43, "r_y3": 406.77, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 222, "label": "text", "bbox": { "l": 502.87, "t": 410.99, "r": 509.19, "b": 417.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 502.87, "r_y0": 417.31, "r_x1": 509.19, "r_y1": 417.31, "r_x2": 509.19, "r_y2": 410.99, "r_x3": 502.87, "r_y3": 410.99, "coord_origin": "TOPLEFT" }, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 223, "label": "text", "bbox": { "l": 384.35, "t": 381.78, "r": 430.99, "b": 386.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.35, "r_y0": 386.44, "r_x1": 430.99, "r_y1": 386.44, "r_x2": 430.99, "r_y2": 381.78, "r_x3": 384.35, "r_y3": 381.78, "coord_origin": "TOPLEFT" }, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 62.6, "t": 458.73, "r": 532.63, "b": 467.63, "coord_origin": "TOPLEFT" }, "confidence": 0.915, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.6, "r_y0": 467.63, "r_x1": 532.63, "r_y1": 467.63, "r_x2": 532.63, "r_y2": 458.73, "r_x3": 62.6, "r_y3": 458.73, "coord_origin": "TOPLEFT" }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 50.11, "t": 491.4, "r": 163.76, "b": 501.25, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 501.25, "r_x1": 64.45, "r_y1": 501.25, "r_x2": 64.45, "r_y2": 491.4, "r_x3": 50.11, "r_y3": 491.4, "coord_origin": "TOPLEFT" }, "text": "5.5.", "orig": "5.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.01, "r_y0": 501.25, "r_x1": 163.76, "r_y1": 501.25, "r_x2": 163.76, "r_y2": 491.4, "r_x3": 74.01, "r_y3": 491.4, "coord_origin": "TOPLEFT" }, "text": "Qualitative Analysis", "orig": "Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.5. Qualitative Analysis" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 536.87, "r": 286.37, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 545.78, "r_x1": 286.36, "r_y1": 545.78, "r_x2": 286.36, "r_y2": 536.87, "r_x3": 62.07, "r_y3": 536.87, "coord_origin": "TOPLEFT" }, "text": "We showcase several visualizations for the different", "orig": "We showcase several visualizations for the different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 557.73, "r_x1": 211.16, "r_y1": 557.73, "r_x2": 211.16, "r_y2": 548.83, "r_x3": 50.11, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.1, "r_y0": 557.51, "r_x1": 259.17, "r_y1": 557.51, "r_x2": 259.17, "r_y2": 548.92, "r_x3": 215.1, "r_y3": 548.92, "coord_origin": "TOPLEFT" }, "text": "\u201ccomplex\u201d", "orig": "\u201ccomplex\u201d", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.12, "r_y0": 557.73, "r_x1": 286.36, "r_y1": 557.73, "r_x2": 286.36, "r_y2": 548.83, "r_x3": 263.12, "r_y3": 548.83, "coord_origin": "TOPLEFT" }, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 569.69, "r_x1": 286.37, "r_y1": 569.69, "r_x2": 286.37, "r_y2": 560.78, "r_x3": 50.11, "r_y3": 560.78, "coord_origin": "TOPLEFT" }, "text": "within datasets presented in this work in Fig. 5 and Fig. 6", "orig": "within datasets presented in this work in Fig. 5 and Fig. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 581.64, "r_x1": 286.37, "r_y1": 581.64, "r_x2": 286.37, "r_y2": 572.74, "r_x3": 50.11, "r_y3": 572.74, "coord_origin": "TOPLEFT" }, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 593.6, "r_x1": 286.37, "r_y1": 593.6, "r_x2": 286.37, "r_y2": 584.69, "r_x3": 50.11, "r_y3": 584.69, "coord_origin": "TOPLEFT" }, "text": "for all table cells, even for the empty ones. Additionally,", "orig": "for all table cells, even for the empty ones. Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 605.56, "r_x1": 286.37, "r_y1": 605.56, "r_x2": 286.37, "r_y2": 596.65, "r_x3": 50.11, "r_y3": 596.65, "coord_origin": "TOPLEFT" }, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 617.51, "r_x1": 286.37, "r_y1": 617.51, "r_x2": 286.37, "r_y2": 608.6, "r_x3": 50.11, "r_y3": 608.6, "coord_origin": "TOPLEFT" }, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 629.47, "r_x1": 286.37, "r_y1": 629.47, "r_x2": 286.37, "r_y2": 620.56, "r_x3": 50.11, "r_y3": 620.56, "coord_origin": "TOPLEFT" }, "text": "based on their overlap and spatial proximity. The left part", "orig": "based on their overlap and spatial proximity. The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 641.42, "r_x1": 286.37, "r_y1": 641.42, "r_x2": 286.37, "r_y2": 632.51, "r_x3": 50.11, "r_y3": 632.51, "coord_origin": "TOPLEFT" }, "text": "of Fig. 5 demonstrates also the adaptability of our method", "orig": "of Fig. 5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 653.38, "r_x1": 286.37, "r_y1": 653.38, "r_x2": 286.37, "r_y2": 644.47, "r_x3": 50.11, "r_y3": 644.47, "coord_origin": "TOPLEFT" }, "text": "to any language, as it can successfully extract Japanese", "orig": "to any language, as it can successfully extract Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 665.33, "r_x1": 286.37, "r_y1": 665.33, "r_x2": 286.37, "r_y2": 656.42, "r_x3": 50.11, "r_y3": 656.42, "coord_origin": "TOPLEFT" }, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 677.29, "r_x1": 286.37, "r_y1": 677.29, "r_x2": 286.37, "r_y2": 668.38, "r_x3": 50.11, "r_y3": 668.38, "coord_origin": "TOPLEFT" }, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 689.24, "r_x1": 286.37, "r_y1": 689.24, "r_x2": 286.37, "r_y2": 680.34, "r_x3": 50.11, "r_y3": 680.34, "coord_origin": "TOPLEFT" }, "text": "steps in the supplementary material. Overall these illustra-", "orig": "steps in the supplementary material. Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.2, "r_x1": 286.37, "r_y1": 701.2, "r_x2": 286.37, "r_y2": 692.29, "r_x3": 50.11, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 226.89, "r_y1": 713.15, "r_x2": 226.89, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We showcase several visualizations for the different components of our network on various \"complex\" tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type." }, { "label": "section_header", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 308.86, "t": 490.71, "r": 460.85, "b": 501.46, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 201, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 501.46, "r_x1": 316.07, "r_y1": 501.46, "r_x2": 316.07, "r_y2": 490.71, "r_x3": 308.86, "r_y3": 490.71, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 202, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 325.69, "r_y0": 501.46, "r_x1": 460.85, "r_y1": 501.46, "r_x2": 460.85, "r_y2": 490.71, "r_x3": 325.69, "r_y3": 490.71, "coord_origin": "TOPLEFT" }, "text": "Future Work & Conclusion", "orig": "Future Work & Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Future Work & Conclusion" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 308.86, "t": 512.89, "r": 545.12, "b": 653.31, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 203, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 521.8, "r_x1": 545.12, "r_y1": 521.8, "r_x2": 545.12, "r_y2": 512.89, "r_x3": 320.82, "r_y3": 512.89, "coord_origin": "TOPLEFT" }, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 204, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 533.75, "r_x1": 545.12, "r_y1": 533.75, "r_x2": 545.12, "r_y2": 524.85, "r_x3": 308.86, "r_y3": 524.85, "coord_origin": "TOPLEFT" }, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 205, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.71, "r_x1": 545.12, "r_y1": 545.71, "r_x2": 545.12, "r_y2": 536.8, "r_x3": 308.86, "r_y3": 536.8, "coord_origin": "TOPLEFT" }, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 206, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 557.66, "r_x1": 545.12, "r_y1": 557.66, "r_x2": 545.12, "r_y2": 548.76, "r_x3": 308.86, "r_y3": 548.76, "coord_origin": "TOPLEFT" }, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 207, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.62, "r_x1": 545.12, "r_y1": 569.62, "r_x2": 545.12, "r_y2": 560.71, "r_x3": 308.86, "r_y3": 560.71, "coord_origin": "TOPLEFT" }, "text": "content from PDF or OCR by using bounding boxes. Ad-", "orig": "content from PDF or OCR by using bounding boxes. Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 208, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 581.57, "r_x1": 545.12, "r_y1": 581.57, "r_x2": 545.12, "r_y2": 572.67, "r_x3": 308.86, "r_y3": 572.67, "coord_origin": "TOPLEFT" }, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 209, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 593.53, "r_x1": 545.12, "r_y1": 593.53, "r_x2": 545.12, "r_y2": 584.62, "r_x3": 308.86, "r_y3": 584.62, "coord_origin": "TOPLEFT" }, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 210, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 605.49, "r_x1": 400.47, "r_y1": 605.49, "r_x2": 400.47, "r_y2": 596.58, "r_x3": 308.86, "r_y3": 596.58, "coord_origin": "TOPLEFT" }, "text": "ments, and languages.", "orig": "ments, and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 211, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.38, "r_y0": 605.49, "r_x1": 545.12, "r_y1": 605.49, "r_x2": 545.12, "r_y2": 596.58, "r_x3": 408.38, "r_y3": 596.58, "coord_origin": "TOPLEFT" }, "text": "Furthermore, our method outper-", "orig": "Furthermore, our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 212, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 617.44, "r_x1": 545.12, "r_y1": 617.44, "r_x2": 545.12, "r_y2": 608.53, "r_x3": 308.86, "r_y3": 608.53, "coord_origin": "TOPLEFT" }, "text": "forms all state-of-the-arts with a wide margin. Finally, we", "orig": "forms all state-of-the-arts with a wide margin. Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 213, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 629.4, "r_x1": 545.12, "r_y1": 629.4, "r_x2": 545.12, "r_y2": 620.49, "r_x3": 308.86, "r_y3": 620.49, "coord_origin": "TOPLEFT" }, "text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 214, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 641.35, "r_x1": 545.12, "r_y1": 641.35, "r_x2": 545.12, "r_y2": 632.44, "r_x3": 308.86, "r_y3": 632.44, "coord_origin": "TOPLEFT" }, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 215, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 653.31, "r_x1": 365.86, "r_y1": 653.31, "r_x2": 365.86, "r_y2": 644.4, "r_x3": 308.86, "r_y3": 644.4, "coord_origin": "TOPLEFT" }, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce \"SynthTabNet\" a challenging synthetically generated dataset that reinforces missing characteristics from other datasets." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 308.86, "t": 672.1, "r": 364.41, "b": 682.85, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 216, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 682.85, "r_x1": 364.41, "r_y1": 682.85, "r_x2": 364.41, "r_y2": 672.1, "r_x3": 308.86, "r_y3": 672.1, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 10, "page_no": 7, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 313.35, "t": 693.96, "r": 545.11, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.832, "cells": [ { "index": 217, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 313.35, "r_y0": 701.98, "r_x1": 323.81, "r_y1": 701.98, "r_x2": 323.81, "r_y2": 693.96, "r_x3": 313.35, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 218, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.05, "r_y0": 701.98, "r_x1": 545.11, "r_y1": 701.98, "r_x2": 545.11, "r_y2": 693.96, "r_x3": 326.05, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 219, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 712.94, "r_x1": 545.11, "r_y1": 712.94, "r_x2": 545.11, "r_y2": 704.92, "r_x3": 328.78, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-" }, { "label": "picture", "id": 15, "page_no": 7, "cluster": { "id": 15, "label": "picture", "bbox": { "l": 305.58, "t": 98.65, "r": 554.83, "b": 180.63, "coord_origin": "TOPLEFT" }, "confidence": 0.77, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 14, "page_no": 7, "cluster": { "id": 14, "label": "picture", "bbox": { "l": 49.98, "t": 103.71, "r": 301.63, "b": 187.58, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_footer", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.871, "cells": [ { "index": 220, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" } ] } }, { "page_no": 8, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 83.9, "r_x1": 286.36, "r_y1": 83.9, "r_x2": 286.36, "r_y2": 75.88, "r_x3": 70.03, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "end object detection with transformers. In Andrea Vedaldi,", "orig": "end object detection with transformers. In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 94.86, "r_x1": 286.36, "r_y1": 94.86, "r_x2": 286.36, "r_y2": 86.84, "r_x3": 70.03, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 105.82, "r_x1": 85.72, "r_y1": 105.82, "r_x2": 85.72, "r_y2": 97.8, "r_x3": 70.03, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 87.89, "r_y0": 105.61, "r_x1": 199.93, "r_y1": 105.61, "r_x2": 199.93, "r_y2": 97.88, "r_x3": 87.89, "r_y3": 97.88, "coord_origin": "TOPLEFT" }, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.94, "r_y0": 105.82, "r_x1": 286.36, "r_y1": 105.82, "r_x2": 286.36, "r_y2": 97.8, "r_x3": 199.94, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 116.78, "r_x1": 221.95, "r_y1": 116.78, "r_x2": 221.95, "r_y2": 108.76, "r_x3": 70.03, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 128.05, "r_x1": 65.21, "r_y1": 128.05, "r_x2": 65.21, "r_y2": 120.03, "r_x3": 54.6, "r_y3": 120.03, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.48, "r_y0": 128.05, "r_x1": 286.36, "r_y1": 128.05, "r_x2": 286.36, "r_y2": 120.03, "r_x3": 67.48, "r_y3": 120.03, "coord_origin": "TOPLEFT" }, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 139.01, "r_x1": 179.67, "r_y1": 139.01, "r_x2": 179.67, "r_y2": 130.99, "r_x3": 70.03, "r_y3": 130.99, "coord_origin": "TOPLEFT" }, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58, "r_y0": 139.01, "r_x1": 286.36, "r_y1": 139.01, "r_x2": 286.36, "r_y2": 130.99, "r_x3": 185.58, "r_y3": 130.99, "coord_origin": "TOPLEFT" }, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 149.97, "r_x1": 113.11, "r_y1": 149.97, "r_x2": 113.11, "r_y2": 141.95, "r_x3": 70.03, "r_y3": 141.95, "coord_origin": "TOPLEFT" }, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.34, "r_y0": 149.76, "r_x1": 235.31, "r_y1": 149.76, "r_x2": 235.31, "r_y2": 142.03, "r_x3": 116.34, "r_y3": 142.03, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.31, "r_y0": 149.97, "r_x1": 267.68, "r_y1": 149.97, "r_x2": 267.68, "r_y2": 141.95, "r_x3": 235.31, "r_y3": 141.95, "coord_origin": "TOPLEFT" }, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 161.24, "r_x1": 65.1, "r_y1": 161.24, "r_x2": 65.1, "r_y2": 153.22, "r_x3": 54.6, "r_y3": 153.22, "coord_origin": "TOPLEFT" }, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.36, "r_y0": 161.24, "r_x1": 218.78, "r_y1": 161.24, "r_x2": 218.78, "r_y2": 153.22, "r_x3": 67.36, "r_y3": 153.22, "coord_origin": "TOPLEFT" }, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.98, "r_y0": 161.03, "r_x1": 286.36, "r_y1": 161.03, "r_x2": 286.36, "r_y2": 153.3, "r_x3": 220.98, "r_y3": 153.3, "coord_origin": "TOPLEFT" }, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 171.99, "r_x1": 125.26, "r_y1": 171.99, "r_x2": 125.26, "r_y2": 164.26, "r_x3": 70.03, "r_y3": 164.26, "coord_origin": "TOPLEFT" }, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.26, "r_y0": 172.2, "r_x1": 286.36, "r_y1": 172.2, "r_x2": 286.36, "r_y2": 164.18, "r_x3": 125.26, "r_y3": 164.18, "coord_origin": "TOPLEFT" }, "text": ", pages 647-677. Springer London, London,", "orig": ", pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 183.15, "r_x1": 97.92, "r_y1": 183.15, "r_x2": 97.92, "r_y2": 175.14, "r_x3": 70.03, "r_y3": 175.14, "coord_origin": "TOPLEFT" }, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 194.43, "r_x1": 65.81, "r_y1": 194.43, "r_x2": 65.81, "r_y2": 186.41, "r_x3": 54.59, "r_y3": 186.41, "coord_origin": "TOPLEFT" }, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.21, "r_y0": 194.43, "r_x1": 286.36, "r_y1": 194.43, "r_x2": 286.36, "r_y2": 186.41, "r_x3": 68.21, "r_y3": 186.41, "coord_origin": "TOPLEFT" }, "text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 205.39, "r_x1": 286.36, "r_y1": 205.39, "r_x2": 286.36, "r_y2": 197.37, "r_x3": 70.03, "r_y3": 197.37, "coord_origin": "TOPLEFT" }, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 216.34, "r_x1": 286.36, "r_y1": 216.34, "r_x2": 286.36, "r_y2": 208.33, "r_x3": 70.03, "r_y3": 208.33, "coord_origin": "TOPLEFT" }, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 227.3, "r_x1": 245.84, "r_y1": 227.3, "r_x2": 245.84, "r_y2": 219.29, "r_x3": 70.03, "r_y3": 219.29, "coord_origin": "TOPLEFT" }, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 238.58, "r_x1": 65.38, "r_y1": 238.58, "r_x2": 65.38, "r_y2": 230.56, "r_x3": 54.59, "r_y3": 230.56, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.69, "r_y0": 238.58, "r_x1": 286.36, "r_y1": 238.58, "r_x2": 286.36, "r_y2": 230.56, "r_x3": 67.69, "r_y3": 230.56, "coord_origin": "TOPLEFT" }, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 249.53, "r_x1": 286.36, "r_y1": 249.53, "r_x2": 286.36, "r_y2": 241.52, "r_x3": 70.03, "r_y3": 241.52, "coord_origin": "TOPLEFT" }, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 260.49, "r_x1": 108.4, "r_y1": 260.49, "r_x2": 108.4, "r_y2": 252.48, "r_x3": 70.03, "r_y3": 252.48, "coord_origin": "TOPLEFT" }, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.64, "r_y0": 260.29, "r_x1": 286.36, "r_y1": 260.29, "r_x2": 286.36, "r_y2": 252.56, "r_x3": 110.64, "r_y3": 252.56, "coord_origin": "TOPLEFT" }, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 271.25, "r_x1": 140.58, "r_y1": 271.25, "r_x2": 140.58, "r_y2": 263.52, "r_x3": 70.03, "r_y3": 263.52, "coord_origin": "TOPLEFT" }, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.58, "r_y0": 271.45, "r_x1": 266.48, "r_y1": 271.45, "r_x2": 266.48, "r_y2": 263.44, "r_x3": 140.58, "r_y3": 263.44, "coord_origin": "TOPLEFT" }, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 282.72, "r_x1": 64.85, "r_y1": 282.72, "r_x2": 64.85, "r_y2": 274.71, "r_x3": 54.59, "r_y3": 274.71, "coord_origin": "TOPLEFT" }, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.05, "r_y0": 282.72, "r_x1": 286.37, "r_y1": 282.72, "r_x2": 286.37, "r_y2": 274.71, "r_x3": 67.05, "r_y3": 274.71, "coord_origin": "TOPLEFT" }, "text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 293.68, "r_x1": 179.57, "r_y1": 293.68, "r_x2": 179.57, "r_y2": 285.67, "r_x3": 70.03, "r_y3": 285.67, "coord_origin": "TOPLEFT" }, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.02, "r_y0": 293.68, "r_x1": 194.48, "r_y1": 293.68, "r_x2": 194.48, "r_y2": 285.67, "r_x3": 187.02, "r_y3": 285.67, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.04, "r_y0": 293.48, "r_x1": 286.36, "r_y1": 293.48, "r_x2": 286.36, "r_y2": 285.75, "r_x3": 198.04, "r_y3": 285.75, "coord_origin": "TOPLEFT" }, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 304.44, "r_x1": 260.2, "r_y1": 304.44, "r_x2": 260.2, "r_y2": 296.71, "r_x3": 70.03, "r_y3": 296.71, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.2, "r_y0": 304.64, "r_x1": 286.36, "r_y1": 304.64, "r_x2": 286.36, "r_y2": 296.63, "r_x3": 260.2, "r_y3": 296.63, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 315.6, "r_x1": 142.75, "r_y1": 315.6, "r_x2": 142.75, "r_y2": 307.58, "r_x3": 70.03, "r_y3": 307.58, "coord_origin": "TOPLEFT" }, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 326.87, "r_x1": 65.62, "r_y1": 326.87, "r_x2": 65.62, "r_y2": 318.86, "r_x3": 54.59, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.98, "r_y0": 326.87, "r_x1": 199.49, "r_y1": 326.87, "r_x2": 199.49, "r_y2": 318.86, "r_x3": 67.98, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.99, "r_y0": 326.87, "r_x1": 286.36, "r_y1": 326.87, "r_x2": 286.36, "r_y2": 318.86, "r_x3": 206.99, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 337.83, "r_x1": 176.28, "r_y1": 337.83, "r_x2": 176.28, "r_y2": 329.81, "r_x3": 70.03, "r_y3": 329.81, "coord_origin": "TOPLEFT" }, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.6, "r_y0": 337.83, "r_x1": 190.07, "r_y1": 337.83, "r_x2": 190.07, "r_y2": 329.81, "r_x3": 182.6, "r_y3": 329.81, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.28, "r_y0": 337.62, "r_x1": 286.36, "r_y1": 337.62, "r_x2": 286.36, "r_y2": 329.9, "r_x3": 193.28, "r_y3": 329.9, "coord_origin": "TOPLEFT" }, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 348.58, "r_x1": 206.35, "r_y1": 348.58, "r_x2": 206.35, "r_y2": 340.85, "r_x3": 70.03, "r_y3": 340.85, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (SDAIR\u201995)", "orig": "Analysis and Recognition (SDAIR\u201995)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.35, "r_y0": 348.79, "r_x1": 274.82, "r_y1": 348.79, "r_x2": 274.82, "r_y2": 340.77, "r_x3": 206.35, "r_y3": 340.77, "coord_origin": "TOPLEFT" }, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 360.06, "r_x1": 65.05, "r_y1": 360.06, "r_x2": 65.05, "r_y2": 352.05, "r_x3": 54.59, "r_y3": 352.05, "coord_origin": "TOPLEFT" }, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.29, "r_y0": 360.06, "r_x1": 286.36, "r_y1": 360.06, "r_x2": 286.36, "r_y2": 352.05, "r_x3": 67.29, "r_y3": 352.05, "coord_origin": "TOPLEFT" }, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 371.02, "r_x1": 234.13, "r_y1": 371.02, "r_x2": 234.13, "r_y2": 363.0, "r_x3": 70.03, "r_y3": 363.0, "coord_origin": "TOPLEFT" }, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.05, "r_y0": 371.02, "r_x1": 286.36, "r_y1": 371.02, "r_x2": 286.36, "r_y2": 363.0, "r_x3": 240.05, "r_y3": 363.0, "coord_origin": "TOPLEFT" }, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 381.98, "r_x1": 286.36, "r_y1": 381.98, "r_x2": 286.36, "r_y2": 373.96, "r_x3": 70.03, "r_y3": 373.96, "coord_origin": "TOPLEFT" }, "text": "tors: Cascade network for table detection in document im-", "orig": "tors: Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 392.94, "r_x1": 286.36, "r_y1": 392.94, "r_x2": 286.36, "r_y2": 384.92, "r_x3": 70.03, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 403.9, "r_x1": 114.58, "r_y1": 403.9, "r_x2": 114.58, "r_y2": 395.88, "r_x3": 70.03, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.8, "r_y0": 403.69, "r_x1": 186.73, "r_y1": 403.69, "r_x2": 186.73, "r_y2": 395.96, "r_x3": 117.8, "r_y3": 395.96, "coord_origin": "TOPLEFT" }, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.73, "r_y0": 403.9, "r_x1": 243.0, "r_y1": 403.9, "r_x2": 243.0, "r_y2": 395.88, "r_x3": 186.73, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 415.17, "r_x1": 65.33, "r_y1": 415.17, "r_x2": 65.33, "r_y2": 407.15, "r_x3": 54.6, "r_y3": 407.15, "coord_origin": "TOPLEFT" }, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.64, "r_y0": 415.17, "r_x1": 286.36, "r_y1": 415.17, "r_x2": 286.36, "r_y2": 407.15, "r_x3": 67.64, "r_y3": 407.15, "coord_origin": "TOPLEFT" }, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 426.13, "r_x1": 147.13, "r_y1": 426.13, "r_x2": 147.13, "r_y2": 418.11, "r_x3": 70.03, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.16, "r_y0": 425.92, "r_x1": 286.36, "r_y1": 425.92, "r_x2": 286.36, "r_y2": 418.19, "r_x3": 149.16, "r_y3": 418.19, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 436.88, "r_x1": 213.48, "r_y1": 436.88, "r_x2": 213.48, "r_y2": 429.15, "r_x3": 70.03, "r_y3": 429.15, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.48, "r_y0": 437.09, "r_x1": 261.04, "r_y1": 437.09, "r_x2": 261.04, "r_y2": 429.07, "r_x3": 213.48, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 448.36, "r_x1": 65.4, "r_y1": 448.36, "r_x2": 65.4, "r_y2": 440.34, "r_x3": 50.11, "r_y3": 440.34, "coord_origin": "TOPLEFT" }, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.69, "r_y0": 448.36, "r_x1": 286.36, "r_y1": 448.36, "r_x2": 286.36, "r_y2": 440.34, "r_x3": 67.69, "r_y3": 440.34, "coord_origin": "TOPLEFT" }, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 459.32, "r_x1": 202.74, "r_y1": 459.32, "r_x2": 202.74, "r_y2": 451.3, "r_x3": 70.03, "r_y3": 451.3, "coord_origin": "TOPLEFT" }, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.0, "r_y0": 459.32, "r_x1": 286.36, "r_y1": 459.32, "r_x2": 286.36, "r_y2": 451.3, "r_x3": 209.0, "r_y3": 451.3, "coord_origin": "TOPLEFT" }, "text": "Pingan-vcgroup\u2019s so-", "orig": "Pingan-vcgroup\u2019s so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 470.28, "r_x1": 286.36, "r_y1": 470.28, "r_x2": 286.36, "r_y2": 462.26, "r_x3": 70.03, "r_y3": 462.26, "coord_origin": "TOPLEFT" }, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 481.24, "r_x1": 141.87, "r_y1": 481.24, "r_x2": 141.87, "r_y2": 473.22, "r_x3": 70.03, "r_y3": 473.22, "coord_origin": "TOPLEFT" }, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.1, "r_y0": 481.03, "r_x1": 166.02, "r_y1": 481.03, "r_x2": 166.02, "r_y2": 473.3, "r_x3": 145.1, "r_y3": 473.3, "coord_origin": "TOPLEFT" }, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.01, "r_y0": 481.24, "r_x1": 259.9, "r_y1": 481.24, "r_x2": 259.9, "r_y2": 473.22, "r_x3": 166.01, "r_y3": 473.22, "coord_origin": "TOPLEFT" }, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 492.51, "r_x1": 66.03, "r_y1": 492.51, "r_x2": 66.03, "r_y2": 484.49, "r_x3": 50.11, "r_y3": 484.49, "coord_origin": "TOPLEFT" }, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.42, "r_y0": 492.51, "r_x1": 286.36, "r_y1": 492.51, "r_x2": 286.36, "r_y2": 484.49, "r_x3": 68.42, "r_y3": 484.49, "coord_origin": "TOPLEFT" }, "text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 503.47, "r_x1": 286.36, "r_y1": 503.47, "r_x2": 286.36, "r_y2": 495.45, "r_x3": 70.03, "r_y3": 495.45, "coord_origin": "TOPLEFT" }, "text": "Gordon Wilfong. Medium-independent table detection. In", "orig": "Gordon Wilfong. Medium-independent table detection. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 514.22, "r_x1": 227.41, "r_y1": 514.22, "r_x2": 227.41, "r_y2": 506.49, "r_x3": 70.03, "r_y3": 506.49, "coord_origin": "TOPLEFT" }, "text": "Document Recognition and Retrieval VII", "orig": "Document Recognition and Retrieval VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.41, "r_y0": 514.42, "r_x1": 286.36, "r_y1": 514.42, "r_x2": 286.36, "r_y2": 506.41, "r_x3": 227.41, "r_y3": 506.41, "coord_origin": "TOPLEFT" }, "text": ", volume 3967,", "orig": ", volume 3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 525.38, "r_x1": 286.36, "r_y1": 525.38, "r_x2": 286.36, "r_y2": 517.37, "r_x3": 70.03, "r_y3": 517.37, "coord_origin": "TOPLEFT" }, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 536.34, "r_x1": 112.36, "r_y1": 536.34, "r_x2": 112.36, "r_y2": 528.33, "r_x3": 70.03, "r_y3": 528.33, "coord_origin": "TOPLEFT" }, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 547.61, "r_x1": 65.47, "r_y1": 547.61, "r_x2": 65.47, "r_y2": 539.6, "r_x3": 50.11, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 547.61, "r_x1": 286.36, "r_y1": 547.61, "r_x2": 286.36, "r_y2": 539.6, "r_x3": 67.77, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "Matthew Hurst. A constraint-based approach to table struc-", "orig": "Matthew Hurst. A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 558.57, "r_x1": 136.28, "r_y1": 558.57, "r_x2": 136.28, "r_y2": 550.56, "r_x3": 70.03, "r_y3": 550.56, "coord_origin": "TOPLEFT" }, "text": "ture derivation. In", "orig": "ture derivation. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.81, "r_y0": 558.37, "r_x1": 286.36, "r_y1": 558.37, "r_x2": 286.36, "r_y2": 550.64, "r_x3": 138.81, "r_y3": 550.64, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 569.33, "r_x1": 286.36, "r_y1": 569.33, "r_x2": 286.36, "r_y2": 561.6, "r_x3": 70.03, "r_y3": 561.6, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 580.29, "r_x1": 74.51, "r_y1": 580.29, "r_x2": 74.51, "r_y2": 572.56, "r_x3": 70.03, "r_y3": 572.56, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.51, "r_y0": 580.49, "r_x1": 286.36, "r_y1": 580.49, "r_x2": 286.36, "r_y2": 572.48, "r_x3": 74.51, "r_y3": 572.48, "coord_origin": "TOPLEFT" }, "text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 591.45, "r_x1": 90.36, "r_y1": 591.45, "r_x2": 90.36, "r_y2": 583.43, "r_x3": 70.03, "r_y3": 583.43, "coord_origin": "TOPLEFT" }, "text": "ety. 2", "orig": "ety. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 602.72, "r_x1": 66.27, "r_y1": 602.72, "r_x2": 66.27, "r_y2": 594.71, "r_x3": 50.11, "r_y3": 594.71, "coord_origin": "TOPLEFT" }, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.7, "r_y0": 602.72, "r_x1": 286.36, "r_y1": 602.72, "r_x2": 286.36, "r_y2": 594.71, "r_x3": 68.7, "r_y3": 594.71, "coord_origin": "TOPLEFT" }, "text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 613.68, "r_x1": 286.36, "r_y1": 613.68, "r_x2": 286.36, "r_y2": 605.66, "r_x3": 70.03, "r_y3": 605.66, "coord_origin": "TOPLEFT" }, "text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 624.64, "r_x1": 286.36, "r_y1": 624.64, "r_x2": 286.36, "r_y2": 616.62, "r_x3": 70.03, "r_y3": 616.62, "coord_origin": "TOPLEFT" }, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 635.6, "r_x1": 77.5, "r_y1": 635.6, "r_x2": 77.5, "r_y2": 627.58, "r_x3": 70.03, "r_y3": 627.58, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.92, "r_y0": 635.39, "r_x1": 286.36, "r_y1": 635.39, "r_x2": 286.36, "r_y2": 627.66, "r_x3": 79.92, "r_y3": 627.66, "coord_origin": "TOPLEFT" }, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 646.35, "r_x1": 140.68, "r_y1": 646.35, "r_x2": 140.68, "r_y2": 638.62, "r_x3": 70.03, "r_y3": 638.62, "coord_origin": "TOPLEFT" }, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.68, "r_y0": 646.56, "r_x1": 264.44, "r_y1": 646.56, "r_x2": 264.44, "r_y2": 638.54, "r_x3": 140.68, "r_y3": 638.54, "coord_origin": "TOPLEFT" }, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 657.83, "r_x1": 66.53, "r_y1": 657.83, "r_x2": 66.53, "r_y2": 649.81, "r_x3": 50.11, "r_y3": 649.81, "coord_origin": "TOPLEFT" }, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 69.0, "r_y0": 657.83, "r_x1": 286.36, "r_y1": 657.83, "r_x2": 286.36, "r_y2": 649.81, "r_x3": 69.0, "r_y3": 649.81, "coord_origin": "TOPLEFT" }, "text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 668.79, "r_x1": 93.2, "r_y1": 668.79, "r_x2": 93.2, "r_y2": 660.77, "r_x3": 70.03, "r_y3": 660.77, "coord_origin": "TOPLEFT" }, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.2, "r_y0": 668.79, "r_x1": 286.36, "r_y1": 668.79, "r_x2": 286.36, "r_y2": 660.77, "r_x3": 102.2, "r_y3": 660.77, "coord_origin": "TOPLEFT" }, "text": "Icdar 2021 competition on scientific table image", "orig": "Icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 679.75, "r_x1": 172.0, "r_y1": 679.75, "r_x2": 172.0, "r_y2": 671.73, "r_x3": 70.03, "r_y3": 671.73, "coord_origin": "TOPLEFT" }, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 691.02, "r_x1": 65.52, "r_y1": 691.02, "r_x2": 65.52, "r_y2": 683.0, "r_x3": 50.11, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.83, "r_y0": 691.02, "r_x1": 286.36, "r_y1": 691.02, "r_x2": 286.36, "r_y2": 683.0, "r_x3": 67.83, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Harold W Kuhn. The hungarian method for the assignment", "orig": "Harold W Kuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 701.98, "r_x1": 102.16, "r_y1": 701.98, "r_x2": 102.16, "r_y2": 693.96, "r_x3": 70.03, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 107.55, "r_y0": 701.77, "r_x1": 231.47, "r_y1": 701.77, "r_x2": 231.47, "r_y2": 694.04, "r_x3": 107.55, "r_y3": 694.04, "coord_origin": "TOPLEFT" }, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.48, "r_y0": 701.98, "r_x1": 286.36, "r_y1": 701.98, "r_x2": 286.36, "r_y2": 693.96, "r_x3": 231.48, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": ", 2(1-2):83-97,", "orig": ", 2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 712.94, "r_x1": 97.92, "r_y1": 712.94, "r_x2": 97.92, "r_y2": 704.92, "r_x3": 70.03, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 83.9, "r_x1": 324.75, "r_y1": 83.9, "r_x2": 324.75, "r_y2": 75.88, "r_x3": 308.86, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.13, "r_y0": 83.9, "r_x1": 545.11, "r_y1": 83.9, "r_x2": 545.11, "r_y2": 75.88, "r_x3": 327.13, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 94.86, "r_x1": 545.11, "r_y1": 94.86, "r_x2": 545.11, "r_y2": 86.84, "r_x3": 328.78, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 105.82, "r_x1": 390.96, "r_y1": 105.82, "r_x2": 390.96, "r_y2": 97.8, "r_x3": 328.78, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.27, "r_y0": 105.82, "r_x1": 435.14, "r_y1": 105.82, "r_x2": 435.14, "r_y2": 97.8, "r_x3": 400.27, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.71, "r_y0": 105.82, "r_x1": 545.11, "r_y1": 105.82, "r_x2": 545.11, "r_y2": 97.8, "r_x3": 441.71, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Understanding and generat-", "orig": "Understanding and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 116.78, "r_x1": 440.81, "r_y1": 116.78, "r_x2": 440.81, "r_y2": 108.76, "r_x3": 328.78, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.63, "r_y0": 116.57, "r_x1": 545.11, "r_y1": 116.57, "r_x2": 545.11, "r_y2": 108.84, "r_x3": 446.63, "r_y3": 108.84, "coord_origin": "TOPLEFT" }, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 127.53, "r_x1": 471.13, "r_y1": 127.53, "r_x2": 471.13, "r_y2": 119.8, "r_x3": 328.78, "r_y3": 119.8, "coord_origin": "TOPLEFT" }, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.13, "r_y0": 127.73, "r_x1": 545.11, "r_y1": 127.73, "r_x2": 545.11, "r_y2": 119.72, "r_x3": 471.13, "r_y3": 119.72, "coord_origin": "TOPLEFT" }, "text": ", 35(12):2891-2903,", "orig": ", 35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 138.69, "r_x1": 356.67, "r_y1": 138.69, "r_x2": 356.67, "r_y2": 130.68, "r_x3": 328.78, "r_y3": 130.68, "coord_origin": "TOPLEFT" }, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 150.14, "r_x1": 325.24, "r_y1": 150.14, "r_x2": 325.24, "r_y2": 142.12, "r_x3": 308.86, "r_y3": 142.12, "coord_origin": "TOPLEFT" }, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.7, "r_y0": 150.14, "r_x1": 545.11, "r_y1": 150.14, "r_x2": 545.11, "r_y2": 142.12, "r_x3": 327.7, "r_y3": 142.12, "coord_origin": "TOPLEFT" }, "text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 161.1, "r_x1": 414.45, "r_y1": 161.1, "r_x2": 414.45, "r_y2": 153.08, "r_x3": 328.78, "r_y3": 153.08, "coord_origin": "TOPLEFT" }, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 421.83, "r_y0": 161.1, "r_x1": 545.11, "r_y1": 161.1, "r_x2": 545.11, "r_y2": 153.08, "r_x3": 421.83, "r_y3": 153.08, "coord_origin": "TOPLEFT" }, "text": "Tablebank: A benchmark dataset", "orig": "Tablebank: A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 172.06, "r_x1": 493.63, "r_y1": 172.06, "r_x2": 493.63, "r_y2": 164.04, "r_x3": 328.78, "r_y3": 164.04, "coord_origin": "TOPLEFT" }, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 183.5, "r_x1": 324.27, "r_y1": 183.5, "r_x2": 324.27, "r_y2": 175.49, "r_x3": 308.86, "r_y3": 175.49, "coord_origin": "TOPLEFT" }, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.58, "r_y0": 183.5, "r_x1": 545.11, "r_y1": 183.5, "r_x2": 545.11, "r_y2": 175.49, "r_x3": 326.58, "r_y3": 175.49, "coord_origin": "TOPLEFT" }, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 194.46, "r_x1": 545.11, "r_y1": 194.46, "r_x2": 545.11, "r_y2": 186.45, "r_x3": 328.78, "r_y3": 186.45, "coord_origin": "TOPLEFT" }, "text": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 205.42, "r_x1": 545.11, "r_y1": 205.42, "r_x2": 545.11, "r_y2": 197.4, "r_x3": 328.78, "r_y3": 197.4, "coord_origin": "TOPLEFT" }, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 216.38, "r_x1": 545.11, "r_y1": 216.38, "r_x2": 545.11, "r_y2": 208.36, "r_x3": 328.78, "r_y3": 208.36, "coord_origin": "TOPLEFT" }, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 227.34, "r_x1": 479.26, "r_y1": 227.34, "r_x2": 479.26, "r_y2": 219.32, "r_x3": 328.78, "r_y3": 219.32, "coord_origin": "TOPLEFT" }, "text": "Escalante, and Roberto Vezzani, editors,", "orig": "Escalante, and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.12, "r_y0": 227.13, "r_x1": 545.11, "r_y1": 227.13, "r_x2": 545.11, "r_y2": 219.4, "r_x3": 483.12, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 238.09, "r_x1": 519.4, "r_y1": 238.09, "r_x2": 519.4, "r_y2": 230.36, "r_x3": 328.78, "r_y3": 230.36, "coord_origin": "TOPLEFT" }, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 519.4, "r_y0": 238.3, "r_x1": 545.11, "r_y1": 238.3, "r_x2": 545.11, "r_y2": 230.28, "r_x3": 519.4, "r_y3": 230.28, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 249.26, "r_x1": 545.11, "r_y1": 249.26, "r_x2": 545.11, "r_y2": 241.24, "r_x3": 328.78, "r_y3": 241.24, "coord_origin": "TOPLEFT" }, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 260.21, "r_x1": 333.26, "r_y1": 260.21, "r_x2": 333.26, "r_y2": 252.2, "r_x3": 328.78, "r_y3": 252.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 271.66, "r_x1": 324.26, "r_y1": 271.66, "r_x2": 324.26, "r_y2": 263.64, "r_x3": 308.86, "r_y3": 263.64, "coord_origin": "TOPLEFT" }, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.58, "r_y0": 271.66, "r_x1": 545.11, "r_y1": 271.66, "r_x2": 545.11, "r_y2": 263.64, "r_x3": 326.58, "r_y3": 263.64, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 282.62, "r_x1": 545.11, "r_y1": 282.62, "r_x2": 545.11, "r_y2": 274.6, "r_x3": 328.78, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 293.58, "r_x1": 545.11, "r_y1": 293.58, "r_x2": 545.11, "r_y2": 285.56, "r_x3": 328.78, "r_y3": 285.56, "coord_origin": "TOPLEFT" }, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 304.54, "r_x1": 545.11, "r_y1": 304.54, "r_x2": 545.11, "r_y2": 296.52, "r_x3": 328.78, "r_y3": 296.52, "coord_origin": "TOPLEFT" }, "text": "bust pdf document conversion using recurrent neural net-", "orig": "bust pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 315.5, "r_x1": 352.85, "r_y1": 315.5, "r_x2": 352.85, "r_y2": 307.48, "r_x3": 328.78, "r_y3": 307.48, "coord_origin": "TOPLEFT" }, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.24, "r_y0": 315.29, "r_x1": 545.11, "r_y1": 315.29, "r_x2": 545.11, "r_y2": 307.56, "r_x3": 360.24, "r_y3": 307.56, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 326.25, "r_x1": 371.02, "r_y1": 326.25, "r_x2": 371.02, "r_y2": 318.52, "r_x3": 328.78, "r_y3": 318.52, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.02, "r_y0": 326.45, "r_x1": 502.26, "r_y1": 326.45, "r_x2": 502.26, "r_y2": 318.44, "r_x3": 371.02, "r_y3": 318.44, "coord_origin": "TOPLEFT" }, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 337.9, "r_x1": 323.83, "r_y1": 337.9, "r_x2": 323.83, "r_y2": 329.88, "r_x3": 308.86, "r_y3": 329.88, "coord_origin": "TOPLEFT" }, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.07, "r_y0": 337.9, "r_x1": 545.11, "r_y1": 337.9, "r_x2": 545.11, "r_y2": 329.88, "r_x3": 326.07, "r_y3": 329.88, "coord_origin": "TOPLEFT" }, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 348.86, "r_x1": 545.11, "r_y1": 348.86, "r_x2": 545.11, "r_y2": 340.84, "r_x3": 328.78, "r_y3": 340.84, "coord_origin": "TOPLEFT" }, "text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 359.82, "r_x1": 382.78, "r_y1": 359.82, "r_x2": 382.78, "r_y2": 351.8, "r_x3": 328.78, "r_y3": 351.8, "coord_origin": "TOPLEFT" }, "text": "in the wild. In", "orig": "in the wild. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.54, "r_y0": 359.61, "r_x1": 545.12, "r_y1": 359.61, "r_x2": 545.12, "r_y2": 351.88, "r_x3": 385.54, "r_y3": 351.88, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 370.57, "r_x1": 443.6, "r_y1": 370.57, "r_x2": 443.6, "r_y2": 362.84, "r_x3": 328.78, "r_y3": 362.84, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 443.59, "r_y0": 370.78, "r_x1": 534.49, "r_y1": 370.78, "r_x2": 534.49, "r_y2": 362.76, "r_x3": 443.59, "r_y3": 362.76, "coord_origin": "TOPLEFT" }, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 382.22, "r_x1": 324.6, "r_y1": 382.22, "r_x2": 324.6, "r_y2": 374.21, "r_x3": 308.86, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.96, "r_y0": 382.22, "r_x1": 362.66, "r_y1": 382.22, "r_x2": 362.66, "r_y2": 374.21, "r_x3": 326.96, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 368.69, "r_y0": 382.22, "r_x1": 389.61, "r_y1": 382.22, "r_x2": 389.61, "r_y2": 374.21, "r_x3": 368.69, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.65, "r_y0": 382.22, "r_x1": 424.56, "r_y1": 382.22, "r_x2": 424.56, "r_y2": 374.21, "r_x3": 395.65, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.55, "r_y0": 382.22, "r_x1": 438.02, "r_y1": 382.22, "r_x2": 438.02, "r_y2": 374.21, "r_x3": 431.55, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.06, "r_y0": 382.22, "r_x1": 488.5, "r_y1": 382.22, "r_x2": 488.5, "r_y2": 374.21, "r_x3": 444.06, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Vishwanath,", "orig": "Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.48, "r_y0": 382.22, "r_x1": 515.41, "r_y1": 382.22, "r_x2": 515.41, "r_y2": 374.21, "r_x3": 495.48, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 521.45, "r_y0": 382.22, "r_x1": 545.11, "r_y1": 382.22, "r_x2": 545.11, "r_y2": 374.21, "r_x3": 521.45, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 393.18, "r_x1": 545.11, "r_y1": 393.18, "r_x2": 545.11, "r_y2": 385.17, "r_x3": 328.78, "r_y3": 385.17, "coord_origin": "TOPLEFT" }, "text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 404.14, "r_x1": 545.11, "r_y1": 404.14, "r_x2": 545.11, "r_y2": 396.12, "r_x3": 328.78, "r_y3": 396.12, "coord_origin": "TOPLEFT" }, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 415.1, "r_x1": 478.01, "r_y1": 415.1, "r_x2": 478.01, "r_y2": 407.08, "r_x3": 328.78, "r_y3": 407.08, "coord_origin": "TOPLEFT" }, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 484.07, "r_y0": 415.1, "r_x1": 491.54, "r_y1": 415.1, "r_x2": 491.54, "r_y2": 407.08, "r_x3": 484.07, "r_y3": 407.08, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 494.67, "r_y0": 414.89, "r_x1": 545.11, "r_y1": 414.89, "r_x2": 545.11, "r_y2": 407.16, "r_x3": 494.67, "r_y3": 407.16, "coord_origin": "TOPLEFT" }, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 425.85, "r_x1": 545.11, "r_y1": 425.85, "r_x2": 545.11, "r_y2": 418.12, "r_x3": 328.78, "r_y3": 418.12, "coord_origin": "TOPLEFT" }, "text": "tional Conference on Document Analysis and Recognition", "orig": "tional Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 436.81, "r_x1": 360.84, "r_y1": 436.81, "r_x2": 360.84, "r_y2": 429.08, "r_x3": 328.78, "r_y3": 429.08, "coord_origin": "TOPLEFT" }, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.84, "r_y0": 437.02, "r_x1": 475.63, "r_y1": 437.02, "r_x2": 475.63, "r_y2": 429.0, "r_x3": 360.84, "r_y3": 429.0, "coord_origin": "TOPLEFT" }, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.46, "r_x1": 324.57, "r_y1": 448.46, "r_x2": 324.57, "r_y2": 440.45, "r_x3": 308.86, "r_y3": 440.45, "coord_origin": "TOPLEFT" }, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.93, "r_y0": 448.46, "r_x1": 545.11, "r_y1": 448.46, "r_x2": 545.11, "r_y2": 440.45, "r_x3": 326.93, "r_y3": 440.45, "coord_origin": "TOPLEFT" }, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 459.42, "r_x1": 545.11, "r_y1": 459.42, "r_x2": 545.11, "r_y2": 451.41, "r_x3": 328.78, "r_y3": 451.41, "coord_origin": "TOPLEFT" }, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 470.38, "r_x1": 545.11, "r_y1": 470.38, "r_x2": 545.11, "r_y2": 462.36, "r_x3": 328.78, "r_y3": 462.36, "coord_origin": "TOPLEFT" }, "text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 481.34, "r_x1": 545.11, "r_y1": 481.34, "r_x2": 545.11, "r_y2": 473.32, "r_x3": 328.78, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 492.3, "r_x1": 545.11, "r_y1": 492.3, "r_x2": 545.11, "r_y2": 484.28, "r_x3": 328.78, "r_y3": 484.28, "coord_origin": "TOPLEFT" }, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 503.26, "r_x1": 545.11, "r_y1": 503.26, "r_x2": 545.11, "r_y2": 495.24, "r_x3": 328.78, "r_y3": 495.24, "coord_origin": "TOPLEFT" }, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 514.22, "r_x1": 545.11, "r_y1": 514.22, "r_x2": 545.11, "r_y2": 506.2, "r_x3": 328.78, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 525.17, "r_x1": 545.11, "r_y1": 525.17, "r_x2": 545.11, "r_y2": 517.16, "r_x3": 328.78, "r_y3": 517.16, "coord_origin": "TOPLEFT" }, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 536.13, "r_x1": 434.57, "r_y1": 536.13, "r_x2": 434.57, "r_y2": 528.12, "r_x3": 328.78, "r_y3": 528.12, "coord_origin": "TOPLEFT" }, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.86, "r_y0": 535.93, "r_x1": 545.11, "r_y1": 535.93, "r_x2": 545.11, "r_y2": 528.2, "r_x3": 437.86, "r_y3": 528.2, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 546.89, "r_x1": 425.73, "r_y1": 546.89, "r_x2": 425.73, "r_y2": 539.16, "r_x3": 328.78, "r_y3": 539.16, "coord_origin": "TOPLEFT" }, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 425.74, "r_y0": 547.09, "r_x1": 545.11, "r_y1": 547.09, "r_x2": 545.11, "r_y2": 539.08, "r_x3": 425.74, "r_y3": 539.08, "coord_origin": "TOPLEFT" }, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 558.05, "r_x1": 399.74, "r_y1": 558.05, "r_x2": 399.74, "r_y2": 550.03, "r_x3": 328.78, "r_y3": 550.03, "coord_origin": "TOPLEFT" }, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.5, "r_x1": 324.5, "r_y1": 569.5, "r_x2": 324.5, "r_y2": 561.48, "r_x3": 308.86, "r_y3": 561.48, "coord_origin": "TOPLEFT" }, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.85, "r_y0": 569.5, "r_x1": 545.11, "r_y1": 569.5, "r_x2": 545.11, "r_y2": 561.48, "r_x3": 326.85, "r_y3": 561.48, "coord_origin": "TOPLEFT" }, "text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 580.46, "r_x1": 545.11, "r_y1": 580.46, "r_x2": 545.11, "r_y2": 572.44, "r_x3": 328.78, "r_y3": 572.44, "coord_origin": "TOPLEFT" }, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 591.41, "r_x1": 545.11, "r_y1": 591.41, "r_x2": 545.11, "r_y2": 583.4, "r_x3": 328.78, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 602.37, "r_x1": 431.62, "r_y1": 602.37, "r_x2": 431.62, "r_y2": 594.36, "r_x3": 328.78, "r_y3": 594.36, "coord_origin": "TOPLEFT" }, "text": "image-based documents. In", "orig": "image-based documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.69, "r_y0": 602.17, "r_x1": 545.11, "r_y1": 602.17, "r_x2": 545.11, "r_y2": 594.44, "r_x3": 434.69, "r_y3": 594.44, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 613.13, "r_x1": 545.11, "r_y1": 613.13, "r_x2": 545.11, "r_y2": 605.4, "r_x3": 328.78, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition", "orig": "Conference on Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 624.08, "r_x1": 367.8, "r_y1": 624.08, "r_x2": 367.8, "r_y2": 616.36, "r_x3": 328.78, "r_y3": 616.36, "coord_origin": "TOPLEFT" }, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.8, "r_y0": 624.29, "r_x1": 458.69, "r_y1": 624.29, "r_x2": 458.69, "r_y2": 616.28, "r_x3": 367.8, "r_y3": 616.28, "coord_origin": "TOPLEFT" }, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 635.74, "r_x1": 324.69, "r_y1": 635.74, "r_x2": 324.69, "r_y2": 627.72, "r_x3": 308.86, "r_y3": 627.72, "coord_origin": "TOPLEFT" }, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.07, "r_y0": 635.74, "r_x1": 545.11, "r_y1": 635.74, "r_x2": 545.11, "r_y2": 627.72, "r_x3": 327.07, "r_y3": 627.72, "coord_origin": "TOPLEFT" }, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 646.7, "r_x1": 545.11, "r_y1": 646.7, "r_x2": 545.11, "r_y2": 638.68, "r_x3": 328.78, "r_y3": 638.68, "coord_origin": "TOPLEFT" }, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 657.65, "r_x1": 336.25, "r_y1": 657.65, "r_x2": 336.25, "r_y2": 649.64, "r_x3": 328.78, "r_y3": 649.64, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.12, "r_y1": 657.45, "r_x2": 545.12, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 668.41, "r_x1": 406.32, "r_y1": 668.41, "r_x2": 406.32, "r_y2": 660.68, "r_x3": 328.78, "r_y3": 660.68, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32, "r_y0": 668.61, "r_x1": 521.12, "r_y1": 668.61, "r_x2": 521.12, "r_y2": 660.6, "r_x3": 406.32, "r_y3": 660.6, "coord_origin": "TOPLEFT" }, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 680.06, "r_x1": 324.71, "r_y1": 680.06, "r_x2": 324.71, "r_y2": 672.04, "r_x3": 308.86, "r_y3": 672.04, "coord_origin": "TOPLEFT" }, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.09, "r_y0": 680.06, "r_x1": 545.11, "r_y1": 680.06, "r_x2": 545.11, "r_y2": 672.04, "r_x3": 327.09, "r_y3": 672.04, "coord_origin": "TOPLEFT" }, "text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 691.02, "r_x1": 482.81, "r_y1": 691.02, "r_x2": 482.81, "r_y2": 683.0, "r_x3": 328.78, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.75, "r_y0": 691.02, "r_x1": 545.11, "r_y1": 691.02, "r_x2": 545.11, "r_y2": 683.0, "r_x3": 488.75, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 701.98, "r_x1": 545.11, "r_y1": 701.98, "r_x2": 545.11, "r_y2": 693.96, "r_x3": 328.78, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 712.94, "r_x1": 379.15, "r_y1": 712.94, "r_x2": 379.15, "r_y2": 704.92, "r_x3": 328.78, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "regression. In", "orig": "regression. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 381.62, "r_y0": 712.73, "r_x1": 545.11, "r_y1": 712.73, "r_x2": 545.11, "r_y2": 705.0, "r_x3": 381.62, "r_y3": 705.0, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 25, "label": "list_item", "bbox": { "l": 70.03, "t": 75.88, "r": 286.36, "b": 116.78, "coord_origin": "TOPLEFT" }, "confidence": 0.731, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 83.9, "r_x1": 286.36, "r_y1": 83.9, "r_x2": 286.36, "r_y2": 75.88, "r_x3": 70.03, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "end object detection with transformers. In Andrea Vedaldi,", "orig": "end object detection with transformers. In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 94.86, "r_x1": 286.36, "r_y1": 94.86, "r_x2": 286.36, "r_y2": 86.84, "r_x3": 70.03, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 105.82, "r_x1": 85.72, "r_y1": 105.82, "r_x2": 85.72, "r_y2": 97.8, "r_x3": 70.03, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 87.89, "r_y0": 105.61, "r_x1": 199.93, "r_y1": 105.61, "r_x2": 199.93, "r_y2": 97.88, "r_x3": 87.89, "r_y3": 97.88, "coord_origin": "TOPLEFT" }, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.94, "r_y0": 105.82, "r_x1": 286.36, "r_y1": 105.82, "r_x2": 286.36, "r_y2": 97.8, "r_x3": 199.94, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 116.78, "r_x1": 221.95, "r_y1": 116.78, "r_x2": 221.95, "r_y2": 108.76, "r_x3": 70.03, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 54.6, "t": 120.03, "r": 286.36, "b": 149.97, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 128.05, "r_x1": 65.21, "r_y1": 128.05, "r_x2": 65.21, "r_y2": 120.03, "r_x3": 54.6, "r_y3": 120.03, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.48, "r_y0": 128.05, "r_x1": 286.36, "r_y1": 128.05, "r_x2": 286.36, "r_y2": 120.03, "r_x3": 67.48, "r_y3": 120.03, "coord_origin": "TOPLEFT" }, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 139.01, "r_x1": 179.67, "r_y1": 139.01, "r_x2": 179.67, "r_y2": 130.99, "r_x3": 70.03, "r_y3": 130.99, "coord_origin": "TOPLEFT" }, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58, "r_y0": 139.01, "r_x1": 286.36, "r_y1": 139.01, "r_x2": 286.36, "r_y2": 130.99, "r_x3": 185.58, "r_y3": 130.99, "coord_origin": "TOPLEFT" }, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 149.97, "r_x1": 113.11, "r_y1": 149.97, "r_x2": 113.11, "r_y2": 141.95, "r_x3": 70.03, "r_y3": 141.95, "coord_origin": "TOPLEFT" }, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.34, "r_y0": 149.76, "r_x1": 235.31, "r_y1": 149.76, "r_x2": 235.31, "r_y2": 142.03, "r_x3": 116.34, "r_y3": 142.03, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.31, "r_y0": 149.97, "r_x1": 267.68, "r_y1": 149.97, "r_x2": 267.68, "r_y2": 141.95, "r_x3": 235.31, "r_y3": 141.95, "coord_origin": "TOPLEFT" }, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 54.6, "t": 153.22, "r": 286.36, "b": 183.15, "coord_origin": "TOPLEFT" }, "confidence": 0.938, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 161.24, "r_x1": 65.1, "r_y1": 161.24, "r_x2": 65.1, "r_y2": 153.22, "r_x3": 54.6, "r_y3": 153.22, "coord_origin": "TOPLEFT" }, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.36, "r_y0": 161.24, "r_x1": 218.78, "r_y1": 161.24, "r_x2": 218.78, "r_y2": 153.22, "r_x3": 67.36, "r_y3": 153.22, "coord_origin": "TOPLEFT" }, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.98, "r_y0": 161.03, "r_x1": 286.36, "r_y1": 161.03, "r_x2": 286.36, "r_y2": 153.3, "r_x3": 220.98, "r_y3": 153.3, "coord_origin": "TOPLEFT" }, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 171.99, "r_x1": 125.26, "r_y1": 171.99, "r_x2": 125.26, "r_y2": 164.26, "r_x3": 70.03, "r_y3": 164.26, "coord_origin": "TOPLEFT" }, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.26, "r_y0": 172.2, "r_x1": 286.36, "r_y1": 172.2, "r_x2": 286.36, "r_y2": 164.18, "r_x3": 125.26, "r_y3": 164.18, "coord_origin": "TOPLEFT" }, "text": ", pages 647-677. Springer London, London,", "orig": ", pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 183.15, "r_x1": 97.92, "r_y1": 183.15, "r_x2": 97.92, "r_y2": 175.14, "r_x3": 70.03, "r_y3": 175.14, "coord_origin": "TOPLEFT" }, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "list_item", "bbox": { "l": 54.59, "t": 186.41, "r": 286.36, "b": 227.3, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 194.43, "r_x1": 65.81, "r_y1": 194.43, "r_x2": 65.81, "r_y2": 186.41, "r_x3": 54.59, "r_y3": 186.41, "coord_origin": "TOPLEFT" }, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.21, "r_y0": 194.43, "r_x1": 286.36, "r_y1": 194.43, "r_x2": 286.36, "r_y2": 186.41, "r_x3": 68.21, "r_y3": 186.41, "coord_origin": "TOPLEFT" }, "text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 205.39, "r_x1": 286.36, "r_y1": 205.39, "r_x2": 286.36, "r_y2": 197.37, "r_x3": 70.03, "r_y3": 197.37, "coord_origin": "TOPLEFT" }, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 216.34, "r_x1": 286.36, "r_y1": 216.34, "r_x2": 286.36, "r_y2": 208.33, "r_x3": 70.03, "r_y3": 208.33, "coord_origin": "TOPLEFT" }, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 227.3, "r_x1": 245.84, "r_y1": 227.3, "r_x2": 245.84, "r_y2": 219.29, "r_x3": 70.03, "r_y3": 219.29, "coord_origin": "TOPLEFT" }, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 54.59, "t": 230.56, "r": 286.36, "b": 271.45, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 238.58, "r_x1": 65.38, "r_y1": 238.58, "r_x2": 65.38, "r_y2": 230.56, "r_x3": 54.59, "r_y3": 230.56, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.69, "r_y0": 238.58, "r_x1": 286.36, "r_y1": 238.58, "r_x2": 286.36, "r_y2": 230.56, "r_x3": 67.69, "r_y3": 230.56, "coord_origin": "TOPLEFT" }, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 249.53, "r_x1": 286.36, "r_y1": 249.53, "r_x2": 286.36, "r_y2": 241.52, "r_x3": 70.03, "r_y3": 241.52, "coord_origin": "TOPLEFT" }, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 260.49, "r_x1": 108.4, "r_y1": 260.49, "r_x2": 108.4, "r_y2": 252.48, "r_x3": 70.03, "r_y3": 252.48, "coord_origin": "TOPLEFT" }, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.64, "r_y0": 260.29, "r_x1": 286.36, "r_y1": 260.29, "r_x2": 286.36, "r_y2": 252.56, "r_x3": 110.64, "r_y3": 252.56, "coord_origin": "TOPLEFT" }, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 271.25, "r_x1": 140.58, "r_y1": 271.25, "r_x2": 140.58, "r_y2": 263.52, "r_x3": 70.03, "r_y3": 263.52, "coord_origin": "TOPLEFT" }, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.58, "r_y0": 271.45, "r_x1": 266.48, "r_y1": 271.45, "r_x2": 266.48, "r_y2": 263.44, "r_x3": 140.58, "r_y3": 263.44, "coord_origin": "TOPLEFT" }, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 54.59, "t": 274.71, "r": 286.37, "b": 315.6, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 282.72, "r_x1": 64.85, "r_y1": 282.72, "r_x2": 64.85, "r_y2": 274.71, "r_x3": 54.59, "r_y3": 274.71, "coord_origin": "TOPLEFT" }, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.05, "r_y0": 282.72, "r_x1": 286.37, "r_y1": 282.72, "r_x2": 286.37, "r_y2": 274.71, "r_x3": 67.05, "r_y3": 274.71, "coord_origin": "TOPLEFT" }, "text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 293.68, "r_x1": 179.57, "r_y1": 293.68, "r_x2": 179.57, "r_y2": 285.67, "r_x3": 70.03, "r_y3": 285.67, "coord_origin": "TOPLEFT" }, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.02, "r_y0": 293.68, "r_x1": 194.48, "r_y1": 293.68, "r_x2": 194.48, "r_y2": 285.67, "r_x3": 187.02, "r_y3": 285.67, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.04, "r_y0": 293.48, "r_x1": 286.36, "r_y1": 293.48, "r_x2": 286.36, "r_y2": 285.75, "r_x3": 198.04, "r_y3": 285.75, "coord_origin": "TOPLEFT" }, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 304.44, "r_x1": 260.2, "r_y1": 304.44, "r_x2": 260.2, "r_y2": 296.71, "r_x3": 70.03, "r_y3": 296.71, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.2, "r_y0": 304.64, "r_x1": 286.36, "r_y1": 304.64, "r_x2": 286.36, "r_y2": 296.63, "r_x3": 260.2, "r_y3": 296.63, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 315.6, "r_x1": 142.75, "r_y1": 315.6, "r_x2": 142.75, "r_y2": 307.58, "r_x3": 70.03, "r_y3": 307.58, "coord_origin": "TOPLEFT" }, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 54.59, "t": 318.86, "r": 286.36, "b": 348.79, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 326.87, "r_x1": 65.62, "r_y1": 326.87, "r_x2": 65.62, "r_y2": 318.86, "r_x3": 54.59, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.98, "r_y0": 326.87, "r_x1": 199.49, "r_y1": 326.87, "r_x2": 199.49, "r_y2": 318.86, "r_x3": 67.98, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.99, "r_y0": 326.87, "r_x1": 286.36, "r_y1": 326.87, "r_x2": 286.36, "r_y2": 318.86, "r_x3": 206.99, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 337.83, "r_x1": 176.28, "r_y1": 337.83, "r_x2": 176.28, "r_y2": 329.81, "r_x3": 70.03, "r_y3": 329.81, "coord_origin": "TOPLEFT" }, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.6, "r_y0": 337.83, "r_x1": 190.07, "r_y1": 337.83, "r_x2": 190.07, "r_y2": 329.81, "r_x3": 182.6, "r_y3": 329.81, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.28, "r_y0": 337.62, "r_x1": 286.36, "r_y1": 337.62, "r_x2": 286.36, "r_y2": 329.9, "r_x3": 193.28, "r_y3": 329.9, "coord_origin": "TOPLEFT" }, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 348.58, "r_x1": 206.35, "r_y1": 348.58, "r_x2": 206.35, "r_y2": 340.85, "r_x3": 70.03, "r_y3": 340.85, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (SDAIR\u201995)", "orig": "Analysis and Recognition (SDAIR\u201995)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.35, "r_y0": 348.79, "r_x1": 274.82, "r_y1": 348.79, "r_x2": 274.82, "r_y2": 340.77, "r_x3": 206.35, "r_y3": 340.77, "coord_origin": "TOPLEFT" }, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 54.59, "t": 352.05, "r": 286.36, "b": 403.9, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 360.06, "r_x1": 65.05, "r_y1": 360.06, "r_x2": 65.05, "r_y2": 352.05, "r_x3": 54.59, "r_y3": 352.05, "coord_origin": "TOPLEFT" }, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.29, "r_y0": 360.06, "r_x1": 286.36, "r_y1": 360.06, "r_x2": 286.36, "r_y2": 352.05, "r_x3": 67.29, "r_y3": 352.05, "coord_origin": "TOPLEFT" }, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 371.02, "r_x1": 234.13, "r_y1": 371.02, "r_x2": 234.13, "r_y2": 363.0, "r_x3": 70.03, "r_y3": 363.0, "coord_origin": "TOPLEFT" }, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.05, "r_y0": 371.02, "r_x1": 286.36, "r_y1": 371.02, "r_x2": 286.36, "r_y2": 363.0, "r_x3": 240.05, "r_y3": 363.0, "coord_origin": "TOPLEFT" }, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 381.98, "r_x1": 286.36, "r_y1": 381.98, "r_x2": 286.36, "r_y2": 373.96, "r_x3": 70.03, "r_y3": 373.96, "coord_origin": "TOPLEFT" }, "text": "tors: Cascade network for table detection in document im-", "orig": "tors: Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 392.94, "r_x1": 286.36, "r_y1": 392.94, "r_x2": 286.36, "r_y2": 384.92, "r_x3": 70.03, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 403.9, "r_x1": 114.58, "r_y1": 403.9, "r_x2": 114.58, "r_y2": 395.88, "r_x3": 70.03, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.8, "r_y0": 403.69, "r_x1": 186.73, "r_y1": 403.69, "r_x2": 186.73, "r_y2": 395.96, "r_x3": 117.8, "r_y3": 395.96, "coord_origin": "TOPLEFT" }, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.73, "r_y0": 403.9, "r_x1": 243.0, "r_y1": 403.9, "r_x2": 243.0, "r_y2": 395.88, "r_x3": 186.73, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 54.6, "t": 407.15, "r": 286.36, "b": 437.09, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 415.17, "r_x1": 65.33, "r_y1": 415.17, "r_x2": 65.33, "r_y2": 407.15, "r_x3": 54.6, "r_y3": 407.15, "coord_origin": "TOPLEFT" }, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.64, "r_y0": 415.17, "r_x1": 286.36, "r_y1": 415.17, "r_x2": 286.36, "r_y2": 407.15, "r_x3": 67.64, "r_y3": 407.15, "coord_origin": "TOPLEFT" }, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 426.13, "r_x1": 147.13, "r_y1": 426.13, "r_x2": 147.13, "r_y2": 418.11, "r_x3": 70.03, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.16, "r_y0": 425.92, "r_x1": 286.36, "r_y1": 425.92, "r_x2": 286.36, "r_y2": 418.19, "r_x3": 149.16, "r_y3": 418.19, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 436.88, "r_x1": 213.48, "r_y1": 436.88, "r_x2": 213.48, "r_y2": 429.15, "r_x3": 70.03, "r_y3": 429.15, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.48, "r_y0": 437.09, "r_x1": 261.04, "r_y1": 437.09, "r_x2": 261.04, "r_y2": 429.07, "r_x3": 213.48, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "list_item", "bbox": { "l": 50.11, "t": 440.34, "r": 286.36, "b": 481.24, "coord_origin": "TOPLEFT" }, "confidence": 0.927, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 448.36, "r_x1": 65.4, "r_y1": 448.36, "r_x2": 65.4, "r_y2": 440.34, "r_x3": 50.11, "r_y3": 440.34, "coord_origin": "TOPLEFT" }, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.69, "r_y0": 448.36, "r_x1": 286.36, "r_y1": 448.36, "r_x2": 286.36, "r_y2": 440.34, "r_x3": 67.69, "r_y3": 440.34, "coord_origin": "TOPLEFT" }, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 459.32, "r_x1": 202.74, "r_y1": 459.32, "r_x2": 202.74, "r_y2": 451.3, "r_x3": 70.03, "r_y3": 451.3, "coord_origin": "TOPLEFT" }, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.0, "r_y0": 459.32, "r_x1": 286.36, "r_y1": 459.32, "r_x2": 286.36, "r_y2": 451.3, "r_x3": 209.0, "r_y3": 451.3, "coord_origin": "TOPLEFT" }, "text": "Pingan-vcgroup\u2019s so-", "orig": "Pingan-vcgroup\u2019s so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 470.28, "r_x1": 286.36, "r_y1": 470.28, "r_x2": 286.36, "r_y2": 462.26, "r_x3": 70.03, "r_y3": 462.26, "coord_origin": "TOPLEFT" }, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 481.24, "r_x1": 141.87, "r_y1": 481.24, "r_x2": 141.87, "r_y2": 473.22, "r_x3": 70.03, "r_y3": 473.22, "coord_origin": "TOPLEFT" }, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.1, "r_y0": 481.03, "r_x1": 166.02, "r_y1": 481.03, "r_x2": 166.02, "r_y2": 473.3, "r_x3": 145.1, "r_y3": 473.3, "coord_origin": "TOPLEFT" }, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.01, "r_y0": 481.24, "r_x1": 259.9, "r_y1": 481.24, "r_x2": 259.9, "r_y2": 473.22, "r_x3": 166.01, "r_y3": 473.22, "coord_origin": "TOPLEFT" }, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "list_item", "bbox": { "l": 50.11, "t": 484.49, "r": 286.36, "b": 536.34, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 492.51, "r_x1": 66.03, "r_y1": 492.51, "r_x2": 66.03, "r_y2": 484.49, "r_x3": 50.11, "r_y3": 484.49, "coord_origin": "TOPLEFT" }, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.42, "r_y0": 492.51, "r_x1": 286.36, "r_y1": 492.51, "r_x2": 286.36, "r_y2": 484.49, "r_x3": 68.42, "r_y3": 484.49, "coord_origin": "TOPLEFT" }, "text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 503.47, "r_x1": 286.36, "r_y1": 503.47, "r_x2": 286.36, "r_y2": 495.45, "r_x3": 70.03, "r_y3": 495.45, "coord_origin": "TOPLEFT" }, "text": "Gordon Wilfong. Medium-independent table detection. In", "orig": "Gordon Wilfong. Medium-independent table detection. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 514.22, "r_x1": 227.41, "r_y1": 514.22, "r_x2": 227.41, "r_y2": 506.49, "r_x3": 70.03, "r_y3": 506.49, "coord_origin": "TOPLEFT" }, "text": "Document Recognition and Retrieval VII", "orig": "Document Recognition and Retrieval VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.41, "r_y0": 514.42, "r_x1": 286.36, "r_y1": 514.42, "r_x2": 286.36, "r_y2": 506.41, "r_x3": 227.41, "r_y3": 506.41, "coord_origin": "TOPLEFT" }, "text": ", volume 3967,", "orig": ", volume 3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 525.38, "r_x1": 286.36, "r_y1": 525.38, "r_x2": 286.36, "r_y2": 517.37, "r_x3": 70.03, "r_y3": 517.37, "coord_origin": "TOPLEFT" }, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 536.34, "r_x1": 112.36, "r_y1": 536.34, "r_x2": 112.36, "r_y2": 528.33, "r_x3": 70.03, "r_y3": 528.33, "coord_origin": "TOPLEFT" }, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 539.6, "r": 286.36, "b": 591.45, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 547.61, "r_x1": 65.47, "r_y1": 547.61, "r_x2": 65.47, "r_y2": 539.6, "r_x3": 50.11, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 547.61, "r_x1": 286.36, "r_y1": 547.61, "r_x2": 286.36, "r_y2": 539.6, "r_x3": 67.77, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "Matthew Hurst. A constraint-based approach to table struc-", "orig": "Matthew Hurst. A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 558.57, "r_x1": 136.28, "r_y1": 558.57, "r_x2": 136.28, "r_y2": 550.56, "r_x3": 70.03, "r_y3": 550.56, "coord_origin": "TOPLEFT" }, "text": "ture derivation. In", "orig": "ture derivation. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.81, "r_y0": 558.37, "r_x1": 286.36, "r_y1": 558.37, "r_x2": 286.36, "r_y2": 550.64, "r_x3": 138.81, "r_y3": 550.64, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 569.33, "r_x1": 286.36, "r_y1": 569.33, "r_x2": 286.36, "r_y2": 561.6, "r_x3": 70.03, "r_y3": 561.6, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 580.29, "r_x1": 74.51, "r_y1": 580.29, "r_x2": 74.51, "r_y2": 572.56, "r_x3": 70.03, "r_y3": 572.56, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.51, "r_y0": 580.49, "r_x1": 286.36, "r_y1": 580.49, "r_x2": 286.36, "r_y2": 572.48, "r_x3": 74.51, "r_y3": 572.48, "coord_origin": "TOPLEFT" }, "text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 591.45, "r_x1": 90.36, "r_y1": 591.45, "r_x2": 90.36, "r_y2": 583.43, "r_x3": 70.03, "r_y3": 583.43, "coord_origin": "TOPLEFT" }, "text": "ety. 2", "orig": "ety. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 594.71, "r": 286.36, "b": 646.56, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 602.72, "r_x1": 66.27, "r_y1": 602.72, "r_x2": 66.27, "r_y2": 594.71, "r_x3": 50.11, "r_y3": 594.71, "coord_origin": "TOPLEFT" }, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.7, "r_y0": 602.72, "r_x1": 286.36, "r_y1": 602.72, "r_x2": 286.36, "r_y2": 594.71, "r_x3": 68.7, "r_y3": 594.71, "coord_origin": "TOPLEFT" }, "text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 613.68, "r_x1": 286.36, "r_y1": 613.68, "r_x2": 286.36, "r_y2": 605.66, "r_x3": 70.03, "r_y3": 605.66, "coord_origin": "TOPLEFT" }, "text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 624.64, "r_x1": 286.36, "r_y1": 624.64, "r_x2": 286.36, "r_y2": 616.62, "r_x3": 70.03, "r_y3": 616.62, "coord_origin": "TOPLEFT" }, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 635.6, "r_x1": 77.5, "r_y1": 635.6, "r_x2": 77.5, "r_y2": 627.58, "r_x3": 70.03, "r_y3": 627.58, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.92, "r_y0": 635.39, "r_x1": 286.36, "r_y1": 635.39, "r_x2": 286.36, "r_y2": 627.66, "r_x3": 79.92, "r_y3": 627.66, "coord_origin": "TOPLEFT" }, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 646.35, "r_x1": 140.68, "r_y1": 646.35, "r_x2": 140.68, "r_y2": 638.62, "r_x3": 70.03, "r_y3": 638.62, "coord_origin": "TOPLEFT" }, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.68, "r_y0": 646.56, "r_x1": 264.44, "r_y1": 646.56, "r_x2": 264.44, "r_y2": 638.54, "r_x3": 140.68, "r_y3": 638.54, "coord_origin": "TOPLEFT" }, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "list_item", "bbox": { "l": 50.11, "t": 649.81, "r": 286.36, "b": 679.75, "coord_origin": "TOPLEFT" }, "confidence": 0.912, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 657.83, "r_x1": 66.53, "r_y1": 657.83, "r_x2": 66.53, "r_y2": 649.81, "r_x3": 50.11, "r_y3": 649.81, "coord_origin": "TOPLEFT" }, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 69.0, "r_y0": 657.83, "r_x1": 286.36, "r_y1": 657.83, "r_x2": 286.36, "r_y2": 649.81, "r_x3": 69.0, "r_y3": 649.81, "coord_origin": "TOPLEFT" }, "text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 668.79, "r_x1": 93.2, "r_y1": 668.79, "r_x2": 93.2, "r_y2": 660.77, "r_x3": 70.03, "r_y3": 660.77, "coord_origin": "TOPLEFT" }, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.2, "r_y0": 668.79, "r_x1": 286.36, "r_y1": 668.79, "r_x2": 286.36, "r_y2": 660.77, "r_x3": 102.2, "r_y3": 660.77, "coord_origin": "TOPLEFT" }, "text": "Icdar 2021 competition on scientific table image", "orig": "Icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 679.75, "r_x1": 172.0, "r_y1": 679.75, "r_x2": 172.0, "r_y2": 671.73, "r_x3": 70.03, "r_y3": 671.73, "coord_origin": "TOPLEFT" }, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "list_item", "bbox": { "l": 50.11, "t": 683.0, "r": 286.36, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.912, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 691.02, "r_x1": 65.52, "r_y1": 691.02, "r_x2": 65.52, "r_y2": 683.0, "r_x3": 50.11, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.83, "r_y0": 691.02, "r_x1": 286.36, "r_y1": 691.02, "r_x2": 286.36, "r_y2": 683.0, "r_x3": 67.83, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Harold W Kuhn. The hungarian method for the assignment", "orig": "Harold W Kuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 701.98, "r_x1": 102.16, "r_y1": 701.98, "r_x2": 102.16, "r_y2": 693.96, "r_x3": 70.03, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 107.55, "r_y0": 701.77, "r_x1": 231.47, "r_y1": 701.77, "r_x2": 231.47, "r_y2": 694.04, "r_x3": 107.55, "r_y3": 694.04, "coord_origin": "TOPLEFT" }, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.48, "r_y0": 701.98, "r_x1": 286.36, "r_y1": 701.98, "r_x2": 286.36, "r_y2": 693.96, "r_x3": 231.48, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": ", 2(1-2):83-97,", "orig": ", 2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 712.94, "r_x1": 97.92, "r_y1": 712.94, "r_x2": 97.92, "r_y2": 704.92, "r_x3": 70.03, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 75.88, "r": 545.11, "b": 138.69, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 83.9, "r_x1": 324.75, "r_y1": 83.9, "r_x2": 324.75, "r_y2": 75.88, "r_x3": 308.86, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.13, "r_y0": 83.9, "r_x1": 545.11, "r_y1": 83.9, "r_x2": 545.11, "r_y2": 75.88, "r_x3": 327.13, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 94.86, "r_x1": 545.11, "r_y1": 94.86, "r_x2": 545.11, "r_y2": 86.84, "r_x3": 328.78, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 105.82, "r_x1": 390.96, "r_y1": 105.82, "r_x2": 390.96, "r_y2": 97.8, "r_x3": 328.78, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.27, "r_y0": 105.82, "r_x1": 435.14, "r_y1": 105.82, "r_x2": 435.14, "r_y2": 97.8, "r_x3": 400.27, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.71, "r_y0": 105.82, "r_x1": 545.11, "r_y1": 105.82, "r_x2": 545.11, "r_y2": 97.8, "r_x3": 441.71, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Understanding and generat-", "orig": "Understanding and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 116.78, "r_x1": 440.81, "r_y1": 116.78, "r_x2": 440.81, "r_y2": 108.76, "r_x3": 328.78, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.63, "r_y0": 116.57, "r_x1": 545.11, "r_y1": 116.57, "r_x2": 545.11, "r_y2": 108.84, "r_x3": 446.63, "r_y3": 108.84, "coord_origin": "TOPLEFT" }, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 127.53, "r_x1": 471.13, "r_y1": 127.53, "r_x2": 471.13, "r_y2": 119.8, "r_x3": 328.78, "r_y3": 119.8, "coord_origin": "TOPLEFT" }, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.13, "r_y0": 127.73, "r_x1": 545.11, "r_y1": 127.73, "r_x2": 545.11, "r_y2": 119.72, "r_x3": 471.13, "r_y3": 119.72, "coord_origin": "TOPLEFT" }, "text": ", 35(12):2891-2903,", "orig": ", 35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 138.69, "r_x1": 356.67, "r_y1": 138.69, "r_x2": 356.67, "r_y2": 130.68, "r_x3": 328.78, "r_y3": 130.68, "coord_origin": "TOPLEFT" }, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "list_item", "bbox": { "l": 308.86, "t": 142.12, "r": 545.11, "b": 172.06, "coord_origin": "TOPLEFT" }, "confidence": 0.925, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 150.14, "r_x1": 325.24, "r_y1": 150.14, "r_x2": 325.24, "r_y2": 142.12, "r_x3": 308.86, "r_y3": 142.12, "coord_origin": "TOPLEFT" }, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.7, "r_y0": 150.14, "r_x1": 545.11, "r_y1": 150.14, "r_x2": 545.11, "r_y2": 142.12, "r_x3": 327.7, "r_y3": 142.12, "coord_origin": "TOPLEFT" }, "text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 161.1, "r_x1": 414.45, "r_y1": 161.1, "r_x2": 414.45, "r_y2": 153.08, "r_x3": 328.78, "r_y3": 153.08, "coord_origin": "TOPLEFT" }, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 421.83, "r_y0": 161.1, "r_x1": 545.11, "r_y1": 161.1, "r_x2": 545.11, "r_y2": 153.08, "r_x3": 421.83, "r_y3": 153.08, "coord_origin": "TOPLEFT" }, "text": "Tablebank: A benchmark dataset", "orig": "Tablebank: A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 172.06, "r_x1": 493.63, "r_y1": 172.06, "r_x2": 493.63, "r_y2": 164.04, "r_x3": 328.78, "r_y3": 164.04, "coord_origin": "TOPLEFT" }, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 308.86, "t": 175.49, "r": 545.11, "b": 260.21, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 183.5, "r_x1": 324.27, "r_y1": 183.5, "r_x2": 324.27, "r_y2": 175.49, "r_x3": 308.86, "r_y3": 175.49, "coord_origin": "TOPLEFT" }, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.58, "r_y0": 183.5, "r_x1": 545.11, "r_y1": 183.5, "r_x2": 545.11, "r_y2": 175.49, "r_x3": 326.58, "r_y3": 175.49, "coord_origin": "TOPLEFT" }, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 194.46, "r_x1": 545.11, "r_y1": 194.46, "r_x2": 545.11, "r_y2": 186.45, "r_x3": 328.78, "r_y3": 186.45, "coord_origin": "TOPLEFT" }, "text": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 205.42, "r_x1": 545.11, "r_y1": 205.42, "r_x2": 545.11, "r_y2": 197.4, "r_x3": 328.78, "r_y3": 197.4, "coord_origin": "TOPLEFT" }, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 216.38, "r_x1": 545.11, "r_y1": 216.38, "r_x2": 545.11, "r_y2": 208.36, "r_x3": 328.78, "r_y3": 208.36, "coord_origin": "TOPLEFT" }, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 227.34, "r_x1": 479.26, "r_y1": 227.34, "r_x2": 479.26, "r_y2": 219.32, "r_x3": 328.78, "r_y3": 219.32, "coord_origin": "TOPLEFT" }, "text": "Escalante, and Roberto Vezzani, editors,", "orig": "Escalante, and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.12, "r_y0": 227.13, "r_x1": 545.11, "r_y1": 227.13, "r_x2": 545.11, "r_y2": 219.4, "r_x3": 483.12, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 238.09, "r_x1": 519.4, "r_y1": 238.09, "r_x2": 519.4, "r_y2": 230.36, "r_x3": 328.78, "r_y3": 230.36, "coord_origin": "TOPLEFT" }, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 519.4, "r_y0": 238.3, "r_x1": 545.11, "r_y1": 238.3, "r_x2": 545.11, "r_y2": 230.28, "r_x3": 519.4, "r_y3": 230.28, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 249.26, "r_x1": 545.11, "r_y1": 249.26, "r_x2": 545.11, "r_y2": 241.24, "r_x3": 328.78, "r_y3": 241.24, "coord_origin": "TOPLEFT" }, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 260.21, "r_x1": 333.26, "r_y1": 260.21, "r_x2": 333.26, "r_y2": 252.2, "r_x3": 328.78, "r_y3": 252.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 308.86, "t": 263.64, "r": 545.11, "b": 326.45, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 271.66, "r_x1": 324.26, "r_y1": 271.66, "r_x2": 324.26, "r_y2": 263.64, "r_x3": 308.86, "r_y3": 263.64, "coord_origin": "TOPLEFT" }, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.58, "r_y0": 271.66, "r_x1": 545.11, "r_y1": 271.66, "r_x2": 545.11, "r_y2": 263.64, "r_x3": 326.58, "r_y3": 263.64, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 282.62, "r_x1": 545.11, "r_y1": 282.62, "r_x2": 545.11, "r_y2": 274.6, "r_x3": 328.78, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 293.58, "r_x1": 545.11, "r_y1": 293.58, "r_x2": 545.11, "r_y2": 285.56, "r_x3": 328.78, "r_y3": 285.56, "coord_origin": "TOPLEFT" }, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 304.54, "r_x1": 545.11, "r_y1": 304.54, "r_x2": 545.11, "r_y2": 296.52, "r_x3": 328.78, "r_y3": 296.52, "coord_origin": "TOPLEFT" }, "text": "bust pdf document conversion using recurrent neural net-", "orig": "bust pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 315.5, "r_x1": 352.85, "r_y1": 315.5, "r_x2": 352.85, "r_y2": 307.48, "r_x3": 328.78, "r_y3": 307.48, "coord_origin": "TOPLEFT" }, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.24, "r_y0": 315.29, "r_x1": 545.11, "r_y1": 315.29, "r_x2": 545.11, "r_y2": 307.56, "r_x3": 360.24, "r_y3": 307.56, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 326.25, "r_x1": 371.02, "r_y1": 326.25, "r_x2": 371.02, "r_y2": 318.52, "r_x3": 328.78, "r_y3": 318.52, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.02, "r_y0": 326.45, "r_x1": 502.26, "r_y1": 326.45, "r_x2": 502.26, "r_y2": 318.44, "r_x3": 371.02, "r_y3": 318.44, "coord_origin": "TOPLEFT" }, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 308.86, "t": 329.88, "r": 545.12, "b": 370.78, "coord_origin": "TOPLEFT" }, "confidence": 0.903, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 337.9, "r_x1": 323.83, "r_y1": 337.9, "r_x2": 323.83, "r_y2": 329.88, "r_x3": 308.86, "r_y3": 329.88, "coord_origin": "TOPLEFT" }, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.07, "r_y0": 337.9, "r_x1": 545.11, "r_y1": 337.9, "r_x2": 545.11, "r_y2": 329.88, "r_x3": 326.07, "r_y3": 329.88, "coord_origin": "TOPLEFT" }, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 348.86, "r_x1": 545.11, "r_y1": 348.86, "r_x2": 545.11, "r_y2": 340.84, "r_x3": 328.78, "r_y3": 340.84, "coord_origin": "TOPLEFT" }, "text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 359.82, "r_x1": 382.78, "r_y1": 359.82, "r_x2": 382.78, "r_y2": 351.8, "r_x3": 328.78, "r_y3": 351.8, "coord_origin": "TOPLEFT" }, "text": "in the wild. In", "orig": "in the wild. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.54, "r_y0": 359.61, "r_x1": 545.12, "r_y1": 359.61, "r_x2": 545.12, "r_y2": 351.88, "r_x3": 385.54, "r_y3": 351.88, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 370.57, "r_x1": 443.6, "r_y1": 370.57, "r_x2": 443.6, "r_y2": 362.84, "r_x3": 328.78, "r_y3": 362.84, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 443.59, "r_y0": 370.78, "r_x1": 534.49, "r_y1": 370.78, "r_x2": 534.49, "r_y2": 362.76, "r_x3": 443.59, "r_y3": 362.76, "coord_origin": "TOPLEFT" }, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "list_item", "bbox": { "l": 308.86, "t": 374.21, "r": 545.11, "b": 437.02, "coord_origin": "TOPLEFT" }, "confidence": 0.883, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 382.22, "r_x1": 324.6, "r_y1": 382.22, "r_x2": 324.6, "r_y2": 374.21, "r_x3": 308.86, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.96, "r_y0": 382.22, "r_x1": 362.66, "r_y1": 382.22, "r_x2": 362.66, "r_y2": 374.21, "r_x3": 326.96, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 368.69, "r_y0": 382.22, "r_x1": 389.61, "r_y1": 382.22, "r_x2": 389.61, "r_y2": 374.21, "r_x3": 368.69, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.65, "r_y0": 382.22, "r_x1": 424.56, "r_y1": 382.22, "r_x2": 424.56, "r_y2": 374.21, "r_x3": 395.65, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.55, "r_y0": 382.22, "r_x1": 438.02, "r_y1": 382.22, "r_x2": 438.02, "r_y2": 374.21, "r_x3": 431.55, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.06, "r_y0": 382.22, "r_x1": 488.5, "r_y1": 382.22, "r_x2": 488.5, "r_y2": 374.21, "r_x3": 444.06, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Vishwanath,", "orig": "Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.48, "r_y0": 382.22, "r_x1": 515.41, "r_y1": 382.22, "r_x2": 515.41, "r_y2": 374.21, "r_x3": 495.48, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 521.45, "r_y0": 382.22, "r_x1": 545.11, "r_y1": 382.22, "r_x2": 545.11, "r_y2": 374.21, "r_x3": 521.45, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 393.18, "r_x1": 545.11, "r_y1": 393.18, "r_x2": 545.11, "r_y2": 385.17, "r_x3": 328.78, "r_y3": 385.17, "coord_origin": "TOPLEFT" }, "text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 404.14, "r_x1": 545.11, "r_y1": 404.14, "r_x2": 545.11, "r_y2": 396.12, "r_x3": 328.78, "r_y3": 396.12, "coord_origin": "TOPLEFT" }, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 415.1, "r_x1": 478.01, "r_y1": 415.1, "r_x2": 478.01, "r_y2": 407.08, "r_x3": 328.78, "r_y3": 407.08, "coord_origin": "TOPLEFT" }, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 484.07, "r_y0": 415.1, "r_x1": 491.54, "r_y1": 415.1, "r_x2": 491.54, "r_y2": 407.08, "r_x3": 484.07, "r_y3": 407.08, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 494.67, "r_y0": 414.89, "r_x1": 545.11, "r_y1": 414.89, "r_x2": 545.11, "r_y2": 407.16, "r_x3": 494.67, "r_y3": 407.16, "coord_origin": "TOPLEFT" }, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 425.85, "r_x1": 545.11, "r_y1": 425.85, "r_x2": 545.11, "r_y2": 418.12, "r_x3": 328.78, "r_y3": 418.12, "coord_origin": "TOPLEFT" }, "text": "tional Conference on Document Analysis and Recognition", "orig": "tional Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 436.81, "r_x1": 360.84, "r_y1": 436.81, "r_x2": 360.84, "r_y2": 429.08, "r_x3": 328.78, "r_y3": 429.08, "coord_origin": "TOPLEFT" }, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.84, "r_y0": 437.02, "r_x1": 475.63, "r_y1": 437.02, "r_x2": 475.63, "r_y2": 429.0, "r_x3": 360.84, "r_y3": 429.0, "coord_origin": "TOPLEFT" }, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "list_item", "bbox": { "l": 308.86, "t": 440.45, "r": 545.11, "b": 558.05, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.46, "r_x1": 324.57, "r_y1": 448.46, "r_x2": 324.57, "r_y2": 440.45, "r_x3": 308.86, "r_y3": 440.45, "coord_origin": "TOPLEFT" }, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.93, "r_y0": 448.46, "r_x1": 545.11, "r_y1": 448.46, "r_x2": 545.11, "r_y2": 440.45, "r_x3": 326.93, "r_y3": 440.45, "coord_origin": "TOPLEFT" }, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 459.42, "r_x1": 545.11, "r_y1": 459.42, "r_x2": 545.11, "r_y2": 451.41, "r_x3": 328.78, "r_y3": 451.41, "coord_origin": "TOPLEFT" }, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 470.38, "r_x1": 545.11, "r_y1": 470.38, "r_x2": 545.11, "r_y2": 462.36, "r_x3": 328.78, "r_y3": 462.36, "coord_origin": "TOPLEFT" }, "text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 481.34, "r_x1": 545.11, "r_y1": 481.34, "r_x2": 545.11, "r_y2": 473.32, "r_x3": 328.78, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 492.3, "r_x1": 545.11, "r_y1": 492.3, "r_x2": 545.11, "r_y2": 484.28, "r_x3": 328.78, "r_y3": 484.28, "coord_origin": "TOPLEFT" }, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 503.26, "r_x1": 545.11, "r_y1": 503.26, "r_x2": 545.11, "r_y2": 495.24, "r_x3": 328.78, "r_y3": 495.24, "coord_origin": "TOPLEFT" }, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 514.22, "r_x1": 545.11, "r_y1": 514.22, "r_x2": 545.11, "r_y2": 506.2, "r_x3": 328.78, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 525.17, "r_x1": 545.11, "r_y1": 525.17, "r_x2": 545.11, "r_y2": 517.16, "r_x3": 328.78, "r_y3": 517.16, "coord_origin": "TOPLEFT" }, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 536.13, "r_x1": 434.57, "r_y1": 536.13, "r_x2": 434.57, "r_y2": 528.12, "r_x3": 328.78, "r_y3": 528.12, "coord_origin": "TOPLEFT" }, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.86, "r_y0": 535.93, "r_x1": 545.11, "r_y1": 535.93, "r_x2": 545.11, "r_y2": 528.2, "r_x3": 437.86, "r_y3": 528.2, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 546.89, "r_x1": 425.73, "r_y1": 546.89, "r_x2": 425.73, "r_y2": 539.16, "r_x3": 328.78, "r_y3": 539.16, "coord_origin": "TOPLEFT" }, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 425.74, "r_y0": 547.09, "r_x1": 545.11, "r_y1": 547.09, "r_x2": 545.11, "r_y2": 539.08, "r_x3": 425.74, "r_y3": 539.08, "coord_origin": "TOPLEFT" }, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 558.05, "r_x1": 399.74, "r_y1": 558.05, "r_x2": 399.74, "r_y2": 550.03, "r_x3": 328.78, "r_y3": 550.03, "coord_origin": "TOPLEFT" }, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "list_item", "bbox": { "l": 308.86, "t": 561.48, "r": 545.11, "b": 624.29, "coord_origin": "TOPLEFT" }, "confidence": 0.903, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.5, "r_x1": 324.5, "r_y1": 569.5, "r_x2": 324.5, "r_y2": 561.48, "r_x3": 308.86, "r_y3": 561.48, "coord_origin": "TOPLEFT" }, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.85, "r_y0": 569.5, "r_x1": 545.11, "r_y1": 569.5, "r_x2": 545.11, "r_y2": 561.48, "r_x3": 326.85, "r_y3": 561.48, "coord_origin": "TOPLEFT" }, "text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 580.46, "r_x1": 545.11, "r_y1": 580.46, "r_x2": 545.11, "r_y2": 572.44, "r_x3": 328.78, "r_y3": 572.44, "coord_origin": "TOPLEFT" }, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 591.41, "r_x1": 545.11, "r_y1": 591.41, "r_x2": 545.11, "r_y2": 583.4, "r_x3": 328.78, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 602.37, "r_x1": 431.62, "r_y1": 602.37, "r_x2": 431.62, "r_y2": 594.36, "r_x3": 328.78, "r_y3": 594.36, "coord_origin": "TOPLEFT" }, "text": "image-based documents. In", "orig": "image-based documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.69, "r_y0": 602.17, "r_x1": 545.11, "r_y1": 602.17, "r_x2": 545.11, "r_y2": 594.44, "r_x3": 434.69, "r_y3": 594.44, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 613.13, "r_x1": 545.11, "r_y1": 613.13, "r_x2": 545.11, "r_y2": 605.4, "r_x3": 328.78, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition", "orig": "Conference on Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 624.08, "r_x1": 367.8, "r_y1": 624.08, "r_x2": 367.8, "r_y2": 616.36, "r_x3": 328.78, "r_y3": 616.36, "coord_origin": "TOPLEFT" }, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.8, "r_y0": 624.29, "r_x1": 458.69, "r_y1": 624.29, "r_x2": 458.69, "r_y2": 616.28, "r_x3": 367.8, "r_y3": 616.28, "coord_origin": "TOPLEFT" }, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "list_item", "bbox": { "l": 308.86, "t": 627.72, "r": 545.12, "b": 668.61, "coord_origin": "TOPLEFT" }, "confidence": 0.878, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 635.74, "r_x1": 324.69, "r_y1": 635.74, "r_x2": 324.69, "r_y2": 627.72, "r_x3": 308.86, "r_y3": 627.72, "coord_origin": "TOPLEFT" }, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.07, "r_y0": 635.74, "r_x1": 545.11, "r_y1": 635.74, "r_x2": 545.11, "r_y2": 627.72, "r_x3": 327.07, "r_y3": 627.72, "coord_origin": "TOPLEFT" }, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 646.7, "r_x1": 545.11, "r_y1": 646.7, "r_x2": 545.11, "r_y2": 638.68, "r_x3": 328.78, "r_y3": 638.68, "coord_origin": "TOPLEFT" }, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 657.65, "r_x1": 336.25, "r_y1": 657.65, "r_x2": 336.25, "r_y2": 649.64, "r_x3": 328.78, "r_y3": 649.64, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.12, "r_y1": 657.45, "r_x2": 545.12, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 668.41, "r_x1": 406.32, "r_y1": 668.41, "r_x2": 406.32, "r_y2": 660.68, "r_x3": 328.78, "r_y3": 660.68, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32, "r_y0": 668.61, "r_x1": 521.12, "r_y1": 668.61, "r_x2": 521.12, "r_y2": 660.6, "r_x3": 406.32, "r_y3": 660.6, "coord_origin": "TOPLEFT" }, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "list_item", "bbox": { "l": 308.86, "t": 672.04, "r": 545.11, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.865, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 680.06, "r_x1": 324.71, "r_y1": 680.06, "r_x2": 324.71, "r_y2": 672.04, "r_x3": 308.86, "r_y3": 672.04, "coord_origin": "TOPLEFT" }, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.09, "r_y0": 680.06, "r_x1": 545.11, "r_y1": 680.06, "r_x2": 545.11, "r_y2": 672.04, "r_x3": 327.09, "r_y3": 672.04, "coord_origin": "TOPLEFT" }, "text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 691.02, "r_x1": 482.81, "r_y1": 691.02, "r_x2": 482.81, "r_y2": 683.0, "r_x3": 328.78, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.75, "r_y0": 691.02, "r_x1": 545.11, "r_y1": 691.02, "r_x2": 545.11, "r_y2": 683.0, "r_x3": 488.75, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 701.98, "r_x1": 545.11, "r_y1": 701.98, "r_x2": 545.11, "r_y2": 693.96, "r_x3": 328.78, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 712.94, "r_x1": 379.15, "r_y1": 712.94, "r_x2": 379.15, "r_y2": 704.92, "r_x3": 328.78, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "regression. In", "orig": "regression. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 381.62, "r_y0": 712.73, "r_x1": 545.11, "r_y1": 712.73, "r_x2": 545.11, "r_y2": 705.0, "r_x3": 381.62, "r_y3": 705.0, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.88, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "list_item", "id": 25, "page_no": 8, "cluster": { "id": 25, "label": "list_item", "bbox": { "l": 70.03, "t": 75.88, "r": 286.36, "b": 116.78, "coord_origin": "TOPLEFT" }, "confidence": 0.731, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 83.9, "r_x1": 286.36, "r_y1": 83.9, "r_x2": 286.36, "r_y2": 75.88, "r_x3": 70.03, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "end object detection with transformers. In Andrea Vedaldi,", "orig": "end object detection with transformers. In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 94.86, "r_x1": 286.36, "r_y1": 94.86, "r_x2": 286.36, "r_y2": 86.84, "r_x3": 70.03, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 105.82, "r_x1": 85.72, "r_y1": 105.82, "r_x2": 85.72, "r_y2": 97.8, "r_x3": 70.03, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 87.89, "r_y0": 105.61, "r_x1": 199.93, "r_y1": 105.61, "r_x2": 199.93, "r_y2": 97.88, "r_x3": 87.89, "r_y3": 97.88, "coord_origin": "TOPLEFT" }, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.94, "r_y0": 105.82, "r_x1": 286.36, "r_y1": 105.82, "r_x2": 286.36, "r_y2": 97.8, "r_x3": 199.94, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 116.78, "r_x1": 221.95, "r_y1": 116.78, "r_x2": 221.95, "r_y2": 108.76, "r_x3": 70.03, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5" }, { "label": "list_item", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 54.6, "t": 120.03, "r": 286.36, "b": 149.97, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 128.05, "r_x1": 65.21, "r_y1": 128.05, "r_x2": 65.21, "r_y2": 120.03, "r_x3": 54.6, "r_y3": 120.03, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.48, "r_y0": 128.05, "r_x1": 286.36, "r_y1": 128.05, "r_x2": 286.36, "r_y2": 120.03, "r_x3": 67.48, "r_y3": 120.03, "coord_origin": "TOPLEFT" }, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 139.01, "r_x1": 179.67, "r_y1": 139.01, "r_x2": 179.67, "r_y2": 130.99, "r_x3": 70.03, "r_y3": 130.99, "coord_origin": "TOPLEFT" }, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58, "r_y0": 139.01, "r_x1": 286.36, "r_y1": 139.01, "r_x2": 286.36, "r_y2": 130.99, "r_x3": 185.58, "r_y3": 130.99, "coord_origin": "TOPLEFT" }, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 149.97, "r_x1": 113.11, "r_y1": 149.97, "r_x2": 113.11, "r_y2": 141.95, "r_x3": 70.03, "r_y3": 141.95, "coord_origin": "TOPLEFT" }, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.34, "r_y0": 149.76, "r_x1": 235.31, "r_y1": 149.76, "r_x2": 235.31, "r_y2": 142.03, "r_x3": 116.34, "r_y3": 142.03, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.31, "r_y0": 149.97, "r_x1": 267.68, "r_y1": 149.97, "r_x2": 267.68, "r_y2": 141.95, "r_x3": 235.31, "r_y3": 141.95, "coord_origin": "TOPLEFT" }, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3" }, { "label": "list_item", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 54.6, "t": 153.22, "r": 286.36, "b": 183.15, "coord_origin": "TOPLEFT" }, "confidence": 0.938, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 161.24, "r_x1": 65.1, "r_y1": 161.24, "r_x2": 65.1, "r_y2": 153.22, "r_x3": 54.6, "r_y3": 153.22, "coord_origin": "TOPLEFT" }, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.36, "r_y0": 161.24, "r_x1": 218.78, "r_y1": 161.24, "r_x2": 218.78, "r_y2": 153.22, "r_x3": 67.36, "r_y3": 153.22, "coord_origin": "TOPLEFT" }, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.98, "r_y0": 161.03, "r_x1": 286.36, "r_y1": 161.03, "r_x2": 286.36, "r_y2": 153.3, "r_x3": 220.98, "r_y3": 153.3, "coord_origin": "TOPLEFT" }, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 171.99, "r_x1": 125.26, "r_y1": 171.99, "r_x2": 125.26, "r_y2": 164.26, "r_x3": 70.03, "r_y3": 164.26, "coord_origin": "TOPLEFT" }, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.26, "r_y0": 172.2, "r_x1": 286.36, "r_y1": 172.2, "r_x2": 286.36, "r_y2": 164.18, "r_x3": 125.26, "r_y3": 164.18, "coord_origin": "TOPLEFT" }, "text": ", pages 647-677. Springer London, London,", "orig": ", pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 183.15, "r_x1": 97.92, "r_y1": 183.15, "r_x2": 97.92, "r_y2": 175.14, "r_x3": 70.03, "r_y3": 175.14, "coord_origin": "TOPLEFT" }, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2" }, { "label": "list_item", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 54.59, "t": 186.41, "r": 286.36, "b": 227.3, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 194.43, "r_x1": 65.81, "r_y1": 194.43, "r_x2": 65.81, "r_y2": 186.41, "r_x3": 54.59, "r_y3": 186.41, "coord_origin": "TOPLEFT" }, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.21, "r_y0": 194.43, "r_x1": 286.36, "r_y1": 194.43, "r_x2": 286.36, "r_y2": 186.41, "r_x3": 68.21, "r_y3": 186.41, "coord_origin": "TOPLEFT" }, "text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 205.39, "r_x1": 286.36, "r_y1": 205.39, "r_x2": 286.36, "r_y2": 197.37, "r_x3": 70.03, "r_y3": 197.37, "coord_origin": "TOPLEFT" }, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 216.34, "r_x1": 286.36, "r_y1": 216.34, "r_x2": 286.36, "r_y2": 208.33, "r_x3": 70.03, "r_y3": 208.33, "coord_origin": "TOPLEFT" }, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 227.3, "r_x1": 245.84, "r_y1": 227.3, "r_x2": 245.84, "r_y2": 219.29, "r_x3": 70.03, "r_y3": 219.29, "coord_origin": "TOPLEFT" }, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[4] Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2" }, { "label": "list_item", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 54.59, "t": 230.56, "r": 286.36, "b": 271.45, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 238.58, "r_x1": 65.38, "r_y1": 238.58, "r_x2": 65.38, "r_y2": 230.56, "r_x3": 54.59, "r_y3": 230.56, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.69, "r_y0": 238.58, "r_x1": 286.36, "r_y1": 238.58, "r_x2": 286.36, "r_y2": 230.56, "r_x3": 67.69, "r_y3": 230.56, "coord_origin": "TOPLEFT" }, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 249.53, "r_x1": 286.36, "r_y1": 249.53, "r_x2": 286.36, "r_y2": 241.52, "r_x3": 70.03, "r_y3": 241.52, "coord_origin": "TOPLEFT" }, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 260.49, "r_x1": 108.4, "r_y1": 260.49, "r_x2": 108.4, "r_y2": 252.48, "r_x3": 70.03, "r_y3": 252.48, "coord_origin": "TOPLEFT" }, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.64, "r_y0": 260.29, "r_x1": 286.36, "r_y1": 260.29, "r_x2": 286.36, "r_y2": 252.56, "r_x3": 110.64, "r_y3": 252.56, "coord_origin": "TOPLEFT" }, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 271.25, "r_x1": 140.58, "r_y1": 271.25, "r_x2": 140.58, "r_y2": 263.52, "r_x3": 70.03, "r_y3": 263.52, "coord_origin": "TOPLEFT" }, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.58, "r_y0": 271.45, "r_x1": 266.48, "r_y1": 271.45, "r_x2": 266.48, "r_y2": 263.44, "r_x3": 140.58, "r_y3": 263.44, "coord_origin": "TOPLEFT" }, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2" }, { "label": "list_item", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 54.59, "t": 274.71, "r": 286.37, "b": 315.6, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 282.72, "r_x1": 64.85, "r_y1": 282.72, "r_x2": 64.85, "r_y2": 274.71, "r_x3": 54.59, "r_y3": 274.71, "coord_origin": "TOPLEFT" }, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.05, "r_y0": 282.72, "r_x1": 286.37, "r_y1": 282.72, "r_x2": 286.37, "r_y2": 274.71, "r_x3": 67.05, "r_y3": 274.71, "coord_origin": "TOPLEFT" }, "text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 293.68, "r_x1": 179.57, "r_y1": 293.68, "r_x2": 179.57, "r_y2": 285.67, "r_x3": 70.03, "r_y3": 285.67, "coord_origin": "TOPLEFT" }, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.02, "r_y0": 293.68, "r_x1": 194.48, "r_y1": 293.68, "r_x2": 194.48, "r_y2": 285.67, "r_x3": 187.02, "r_y3": 285.67, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.04, "r_y0": 293.48, "r_x1": 286.36, "r_y1": 293.48, "r_x2": 286.36, "r_y2": 285.75, "r_x3": 198.04, "r_y3": 285.75, "coord_origin": "TOPLEFT" }, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 304.44, "r_x1": 260.2, "r_y1": 304.44, "r_x2": 260.2, "r_y2": 296.71, "r_x3": 70.03, "r_y3": 296.71, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.2, "r_y0": 304.64, "r_x1": 286.36, "r_y1": 304.64, "r_x2": 286.36, "r_y2": 296.63, "r_x3": 260.2, "r_y3": 296.63, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 315.6, "r_x1": 142.75, "r_y1": 315.6, "r_x2": 142.75, "r_y2": 307.58, "r_x3": 70.03, "r_y3": 307.58, "coord_origin": "TOPLEFT" }, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[6] Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2" }, { "label": "list_item", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 54.59, "t": 318.86, "r": 286.36, "b": 348.79, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 326.87, "r_x1": 65.62, "r_y1": 326.87, "r_x2": 65.62, "r_y2": 318.86, "r_x3": 54.59, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.98, "r_y0": 326.87, "r_x1": 199.49, "r_y1": 326.87, "r_x2": 199.49, "r_y2": 318.86, "r_x3": 67.98, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.99, "r_y0": 326.87, "r_x1": 286.36, "r_y1": 326.87, "r_x2": 286.36, "r_y2": 318.86, "r_x3": 206.99, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 337.83, "r_x1": 176.28, "r_y1": 337.83, "r_x2": 176.28, "r_y2": 329.81, "r_x3": 70.03, "r_y3": 329.81, "coord_origin": "TOPLEFT" }, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.6, "r_y0": 337.83, "r_x1": 190.07, "r_y1": 337.83, "r_x2": 190.07, "r_y2": 329.81, "r_x3": 182.6, "r_y3": 329.81, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.28, "r_y0": 337.62, "r_x1": 286.36, "r_y1": 337.62, "r_x2": 286.36, "r_y2": 329.9, "r_x3": 193.28, "r_y3": 329.9, "coord_origin": "TOPLEFT" }, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 348.58, "r_x1": 206.35, "r_y1": 348.58, "r_x2": 206.35, "r_y2": 340.85, "r_x3": 70.03, "r_y3": 340.85, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (SDAIR\u201995)", "orig": "Analysis and Recognition (SDAIR\u201995)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.35, "r_y0": 348.79, "r_x1": 274.82, "r_y1": 348.79, "r_x2": 274.82, "r_y2": 340.77, "r_x3": 206.35, "r_y3": 340.77, "coord_origin": "TOPLEFT" }, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2" }, { "label": "list_item", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 54.59, "t": 352.05, "r": 286.36, "b": 403.9, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 360.06, "r_x1": 65.05, "r_y1": 360.06, "r_x2": 65.05, "r_y2": 352.05, "r_x3": 54.59, "r_y3": 352.05, "coord_origin": "TOPLEFT" }, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.29, "r_y0": 360.06, "r_x1": 286.36, "r_y1": 360.06, "r_x2": 286.36, "r_y2": 352.05, "r_x3": 67.29, "r_y3": 352.05, "coord_origin": "TOPLEFT" }, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 371.02, "r_x1": 234.13, "r_y1": 371.02, "r_x2": 234.13, "r_y2": 363.0, "r_x3": 70.03, "r_y3": 363.0, "coord_origin": "TOPLEFT" }, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.05, "r_y0": 371.02, "r_x1": 286.36, "r_y1": 371.02, "r_x2": 286.36, "r_y2": 363.0, "r_x3": 240.05, "r_y3": 363.0, "coord_origin": "TOPLEFT" }, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 381.98, "r_x1": 286.36, "r_y1": 381.98, "r_x2": 286.36, "r_y2": 373.96, "r_x3": 70.03, "r_y3": 373.96, "coord_origin": "TOPLEFT" }, "text": "tors: Cascade network for table detection in document im-", "orig": "tors: Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 392.94, "r_x1": 286.36, "r_y1": 392.94, "r_x2": 286.36, "r_y2": 384.92, "r_x3": 70.03, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 403.9, "r_x1": 114.58, "r_y1": 403.9, "r_x2": 114.58, "r_y2": 395.88, "r_x3": 70.03, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.8, "r_y0": 403.69, "r_x1": 186.73, "r_y1": 403.69, "r_x2": 186.73, "r_y2": 395.96, "r_x3": 117.8, "r_y3": 395.96, "coord_origin": "TOPLEFT" }, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.73, "r_y0": 403.9, "r_x1": 243.0, "r_y1": 403.9, "r_x2": 243.0, "r_y2": 395.88, "r_x3": 186.73, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1" }, { "label": "list_item", "id": 10, "page_no": 8, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 54.6, "t": 407.15, "r": 286.36, "b": 437.09, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 415.17, "r_x1": 65.33, "r_y1": 415.17, "r_x2": 65.33, "r_y2": 407.15, "r_x3": 54.6, "r_y3": 407.15, "coord_origin": "TOPLEFT" }, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.64, "r_y0": 415.17, "r_x1": 286.36, "r_y1": 415.17, "r_x2": 286.36, "r_y2": 407.15, "r_x3": 67.64, "r_y3": 407.15, "coord_origin": "TOPLEFT" }, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 426.13, "r_x1": 147.13, "r_y1": 426.13, "r_x2": 147.13, "r_y2": 418.11, "r_x3": 70.03, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.16, "r_y0": 425.92, "r_x1": 286.36, "r_y1": 425.92, "r_x2": 286.36, "r_y2": 418.19, "r_x3": 149.16, "r_y3": 418.19, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 436.88, "r_x1": 213.48, "r_y1": 436.88, "r_x2": 213.48, "r_y2": 429.15, "r_x3": 70.03, "r_y3": 429.15, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.48, "r_y0": 437.09, "r_x1": 261.04, "r_y1": 437.09, "r_x2": 261.04, "r_y2": 429.07, "r_x3": 213.48, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1" }, { "label": "list_item", "id": 14, "page_no": 8, "cluster": { "id": 14, "label": "list_item", "bbox": { "l": 50.11, "t": 440.34, "r": 286.36, "b": 481.24, "coord_origin": "TOPLEFT" }, "confidence": 0.927, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 448.36, "r_x1": 65.4, "r_y1": 448.36, "r_x2": 65.4, "r_y2": 440.34, "r_x3": 50.11, "r_y3": 440.34, "coord_origin": "TOPLEFT" }, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.69, "r_y0": 448.36, "r_x1": 286.36, "r_y1": 448.36, "r_x2": 286.36, "r_y2": 440.34, "r_x3": 67.69, "r_y3": 440.34, "coord_origin": "TOPLEFT" }, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 459.32, "r_x1": 202.74, "r_y1": 459.32, "r_x2": 202.74, "r_y2": 451.3, "r_x3": 70.03, "r_y3": 451.3, "coord_origin": "TOPLEFT" }, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.0, "r_y0": 459.32, "r_x1": 286.36, "r_y1": 459.32, "r_x2": 286.36, "r_y2": 451.3, "r_x3": 209.0, "r_y3": 451.3, "coord_origin": "TOPLEFT" }, "text": "Pingan-vcgroup\u2019s so-", "orig": "Pingan-vcgroup\u2019s so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 470.28, "r_x1": 286.36, "r_y1": 470.28, "r_x2": 286.36, "r_y2": 462.26, "r_x3": 70.03, "r_y3": 462.26, "coord_origin": "TOPLEFT" }, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 481.24, "r_x1": 141.87, "r_y1": 481.24, "r_x2": 141.87, "r_y2": 473.22, "r_x3": 70.03, "r_y3": 473.22, "coord_origin": "TOPLEFT" }, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.1, "r_y0": 481.03, "r_x1": 166.02, "r_y1": 481.03, "r_x2": 166.02, "r_y2": 473.3, "r_x3": 145.1, "r_y3": 473.3, "coord_origin": "TOPLEFT" }, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.01, "r_y0": 481.24, "r_x1": 259.9, "r_y1": 481.24, "r_x2": 259.9, "r_y2": 473.22, "r_x3": 166.01, "r_y3": 473.22, "coord_origin": "TOPLEFT" }, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2" }, { "label": "list_item", "id": 11, "page_no": 8, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 50.11, "t": 484.49, "r": 286.36, "b": 536.34, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 492.51, "r_x1": 66.03, "r_y1": 492.51, "r_x2": 66.03, "r_y2": 484.49, "r_x3": 50.11, "r_y3": 484.49, "coord_origin": "TOPLEFT" }, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.42, "r_y0": 492.51, "r_x1": 286.36, "r_y1": 492.51, "r_x2": 286.36, "r_y2": 484.49, "r_x3": 68.42, "r_y3": 484.49, "coord_origin": "TOPLEFT" }, "text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 503.47, "r_x1": 286.36, "r_y1": 503.47, "r_x2": 286.36, "r_y2": 495.45, "r_x3": 70.03, "r_y3": 495.45, "coord_origin": "TOPLEFT" }, "text": "Gordon Wilfong. Medium-independent table detection. In", "orig": "Gordon Wilfong. Medium-independent table detection. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 514.22, "r_x1": 227.41, "r_y1": 514.22, "r_x2": 227.41, "r_y2": 506.49, "r_x3": 70.03, "r_y3": 506.49, "coord_origin": "TOPLEFT" }, "text": "Document Recognition and Retrieval VII", "orig": "Document Recognition and Retrieval VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.41, "r_y0": 514.42, "r_x1": 286.36, "r_y1": 514.42, "r_x2": 286.36, "r_y2": 506.41, "r_x3": 227.41, "r_y3": 506.41, "coord_origin": "TOPLEFT" }, "text": ", volume 3967,", "orig": ", volume 3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 525.38, "r_x1": 286.36, "r_y1": 525.38, "r_x2": 286.36, "r_y2": 517.37, "r_x3": 70.03, "r_y3": 517.37, "coord_origin": "TOPLEFT" }, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 536.34, "r_x1": 112.36, "r_y1": 536.34, "r_x2": 112.36, "r_y2": 528.33, "r_x3": 70.03, "r_y3": 528.33, "coord_origin": "TOPLEFT" }, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2" }, { "label": "list_item", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 539.6, "r": 286.36, "b": 591.45, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 547.61, "r_x1": 65.47, "r_y1": 547.61, "r_x2": 65.47, "r_y2": 539.6, "r_x3": 50.11, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 547.61, "r_x1": 286.36, "r_y1": 547.61, "r_x2": 286.36, "r_y2": 539.6, "r_x3": 67.77, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "Matthew Hurst. A constraint-based approach to table struc-", "orig": "Matthew Hurst. A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 558.57, "r_x1": 136.28, "r_y1": 558.57, "r_x2": 136.28, "r_y2": 550.56, "r_x3": 70.03, "r_y3": 550.56, "coord_origin": "TOPLEFT" }, "text": "ture derivation. In", "orig": "ture derivation. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.81, "r_y0": 558.37, "r_x1": 286.36, "r_y1": 558.37, "r_x2": 286.36, "r_y2": 550.64, "r_x3": 138.81, "r_y3": 550.64, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 569.33, "r_x1": 286.36, "r_y1": 569.33, "r_x2": 286.36, "r_y2": 561.6, "r_x3": 70.03, "r_y3": 561.6, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 580.29, "r_x1": 74.51, "r_y1": 580.29, "r_x2": 74.51, "r_y2": 572.56, "r_x3": 70.03, "r_y3": 572.56, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.51, "r_y0": 580.49, "r_x1": 286.36, "r_y1": 580.49, "r_x2": 286.36, "r_y2": 572.48, "r_x3": 74.51, "r_y3": 572.48, "coord_origin": "TOPLEFT" }, "text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 591.45, "r_x1": 90.36, "r_y1": 591.45, "r_x2": 90.36, "r_y2": 583.43, "r_x3": 70.03, "r_y3": 583.43, "coord_origin": "TOPLEFT" }, "text": "ety. 2", "orig": "ety. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2" }, { "label": "list_item", "id": 13, "page_no": 8, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 594.71, "r": 286.36, "b": 646.56, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 602.72, "r_x1": 66.27, "r_y1": 602.72, "r_x2": 66.27, "r_y2": 594.71, "r_x3": 50.11, "r_y3": 594.71, "coord_origin": "TOPLEFT" }, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.7, "r_y0": 602.72, "r_x1": 286.36, "r_y1": 602.72, "r_x2": 286.36, "r_y2": 594.71, "r_x3": 68.7, "r_y3": 594.71, "coord_origin": "TOPLEFT" }, "text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 613.68, "r_x1": 286.36, "r_y1": 613.68, "r_x2": 286.36, "r_y2": 605.66, "r_x3": 70.03, "r_y3": 605.66, "coord_origin": "TOPLEFT" }, "text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 624.64, "r_x1": 286.36, "r_y1": 624.64, "r_x2": 286.36, "r_y2": 616.62, "r_x3": 70.03, "r_y3": 616.62, "coord_origin": "TOPLEFT" }, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 635.6, "r_x1": 77.5, "r_y1": 635.6, "r_x2": 77.5, "r_y2": 627.58, "r_x3": 70.03, "r_y3": 627.58, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.92, "r_y0": 635.39, "r_x1": 286.36, "r_y1": 635.39, "r_x2": 286.36, "r_y2": 627.66, "r_x3": 79.92, "r_y3": 627.66, "coord_origin": "TOPLEFT" }, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 646.35, "r_x1": 140.68, "r_y1": 646.35, "r_x2": 140.68, "r_y2": 638.62, "r_x3": 70.03, "r_y3": 638.62, "coord_origin": "TOPLEFT" }, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.68, "r_y0": 646.56, "r_x1": 264.44, "r_y1": 646.56, "r_x2": 264.44, "r_y2": 638.54, "r_x3": 140.68, "r_y3": 638.54, "coord_origin": "TOPLEFT" }, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2" }, { "label": "list_item", "id": 17, "page_no": 8, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 50.11, "t": 649.81, "r": 286.36, "b": 679.75, "coord_origin": "TOPLEFT" }, "confidence": 0.912, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 657.83, "r_x1": 66.53, "r_y1": 657.83, "r_x2": 66.53, "r_y2": 649.81, "r_x3": 50.11, "r_y3": 649.81, "coord_origin": "TOPLEFT" }, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 69.0, "r_y0": 657.83, "r_x1": 286.36, "r_y1": 657.83, "r_x2": 286.36, "r_y2": 649.81, "r_x3": 69.0, "r_y3": 649.81, "coord_origin": "TOPLEFT" }, "text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 668.79, "r_x1": 93.2, "r_y1": 668.79, "r_x2": 93.2, "r_y2": 660.77, "r_x3": 70.03, "r_y3": 660.77, "coord_origin": "TOPLEFT" }, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.2, "r_y0": 668.79, "r_x1": 286.36, "r_y1": 668.79, "r_x2": 286.36, "r_y2": 660.77, "r_x3": 102.2, "r_y3": 660.77, "coord_origin": "TOPLEFT" }, "text": "Icdar 2021 competition on scientific table image", "orig": "Icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 679.75, "r_x1": 172.0, "r_y1": 679.75, "r_x2": 172.0, "r_y2": 671.73, "r_x3": 70.03, "r_y3": 671.73, "coord_origin": "TOPLEFT" }, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2" }, { "label": "list_item", "id": 16, "page_no": 8, "cluster": { "id": 16, "label": "list_item", "bbox": { "l": 50.11, "t": 683.0, "r": 286.36, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.912, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 691.02, "r_x1": 65.52, "r_y1": 691.02, "r_x2": 65.52, "r_y2": 683.0, "r_x3": 50.11, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.83, "r_y0": 691.02, "r_x1": 286.36, "r_y1": 691.02, "r_x2": 286.36, "r_y2": 683.0, "r_x3": 67.83, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Harold W Kuhn. The hungarian method for the assignment", "orig": "Harold W Kuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 701.98, "r_x1": 102.16, "r_y1": 701.98, "r_x2": 102.16, "r_y2": 693.96, "r_x3": 70.03, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 107.55, "r_y0": 701.77, "r_x1": 231.47, "r_y1": 701.77, "r_x2": 231.47, "r_y2": 694.04, "r_x3": 107.55, "r_y3": 694.04, "coord_origin": "TOPLEFT" }, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.48, "r_y0": 701.98, "r_x1": 286.36, "r_y1": 701.98, "r_x2": 286.36, "r_y2": 693.96, "r_x3": 231.48, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": ", 2(1-2):83-97,", "orig": ", 2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 712.94, "r_x1": 97.92, "r_y1": 712.94, "r_x2": 97.92, "r_y2": 704.92, "r_x3": 70.03, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[15] Harold W Kuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6" }, { "label": "list_item", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 75.88, "r": 545.11, "b": 138.69, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 83.9, "r_x1": 324.75, "r_y1": 83.9, "r_x2": 324.75, "r_y2": 75.88, "r_x3": 308.86, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.13, "r_y0": 83.9, "r_x1": 545.11, "r_y1": 83.9, "r_x2": 545.11, "r_y2": 75.88, "r_x3": 327.13, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 94.86, "r_x1": 545.11, "r_y1": 94.86, "r_x2": 545.11, "r_y2": 86.84, "r_x3": 328.78, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 105.82, "r_x1": 390.96, "r_y1": 105.82, "r_x2": 390.96, "r_y2": 97.8, "r_x3": 328.78, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.27, "r_y0": 105.82, "r_x1": 435.14, "r_y1": 105.82, "r_x2": 435.14, "r_y2": 97.8, "r_x3": 400.27, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.71, "r_y0": 105.82, "r_x1": 545.11, "r_y1": 105.82, "r_x2": 545.11, "r_y2": 97.8, "r_x3": 441.71, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Understanding and generat-", "orig": "Understanding and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 116.78, "r_x1": 440.81, "r_y1": 116.78, "r_x2": 440.81, "r_y2": 108.76, "r_x3": 328.78, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.63, "r_y0": 116.57, "r_x1": 545.11, "r_y1": 116.57, "r_x2": 545.11, "r_y2": 108.84, "r_x3": 446.63, "r_y3": 108.84, "coord_origin": "TOPLEFT" }, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 127.53, "r_x1": 471.13, "r_y1": 127.53, "r_x2": 471.13, "r_y2": 119.8, "r_x3": 328.78, "r_y3": 119.8, "coord_origin": "TOPLEFT" }, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.13, "r_y0": 127.73, "r_x1": 545.11, "r_y1": 127.73, "r_x2": 545.11, "r_y2": 119.72, "r_x3": 471.13, "r_y3": 119.72, "coord_origin": "TOPLEFT" }, "text": ", 35(12):2891-2903,", "orig": ", 35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 138.69, "r_x1": 356.67, "r_y1": 138.69, "r_x2": 356.67, "r_y2": 130.68, "r_x3": 328.78, "r_y3": 130.68, "coord_origin": "TOPLEFT" }, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4" }, { "label": "list_item", "id": 15, "page_no": 8, "cluster": { "id": 15, "label": "list_item", "bbox": { "l": 308.86, "t": 142.12, "r": 545.11, "b": 172.06, "coord_origin": "TOPLEFT" }, "confidence": 0.925, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 150.14, "r_x1": 325.24, "r_y1": 150.14, "r_x2": 325.24, "r_y2": 142.12, "r_x3": 308.86, "r_y3": 142.12, "coord_origin": "TOPLEFT" }, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.7, "r_y0": 150.14, "r_x1": 545.11, "r_y1": 150.14, "r_x2": 545.11, "r_y2": 142.12, "r_x3": 327.7, "r_y3": 142.12, "coord_origin": "TOPLEFT" }, "text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 161.1, "r_x1": 414.45, "r_y1": 161.1, "r_x2": 414.45, "r_y2": 153.08, "r_x3": 328.78, "r_y3": 153.08, "coord_origin": "TOPLEFT" }, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 421.83, "r_y0": 161.1, "r_x1": 545.11, "r_y1": 161.1, "r_x2": 545.11, "r_y2": 153.08, "r_x3": 421.83, "r_y3": 153.08, "coord_origin": "TOPLEFT" }, "text": "Tablebank: A benchmark dataset", "orig": "Tablebank: A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 172.06, "r_x1": 493.63, "r_y1": 172.06, "r_x2": 493.63, "r_y2": 164.04, "r_x3": 328.78, "r_y3": 164.04, "coord_origin": "TOPLEFT" }, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3" }, { "label": "list_item", "id": 12, "page_no": 8, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 308.86, "t": 175.49, "r": 545.11, "b": 260.21, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 183.5, "r_x1": 324.27, "r_y1": 183.5, "r_x2": 324.27, "r_y2": 175.49, "r_x3": 308.86, "r_y3": 175.49, "coord_origin": "TOPLEFT" }, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.58, "r_y0": 183.5, "r_x1": 545.11, "r_y1": 183.5, "r_x2": 545.11, "r_y2": 175.49, "r_x3": 326.58, "r_y3": 175.49, "coord_origin": "TOPLEFT" }, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 194.46, "r_x1": 545.11, "r_y1": 194.46, "r_x2": 545.11, "r_y2": 186.45, "r_x3": 328.78, "r_y3": 186.45, "coord_origin": "TOPLEFT" }, "text": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 205.42, "r_x1": 545.11, "r_y1": 205.42, "r_x2": 545.11, "r_y2": 197.4, "r_x3": 328.78, "r_y3": 197.4, "coord_origin": "TOPLEFT" }, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 216.38, "r_x1": 545.11, "r_y1": 216.38, "r_x2": 545.11, "r_y2": 208.36, "r_x3": 328.78, "r_y3": 208.36, "coord_origin": "TOPLEFT" }, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 227.34, "r_x1": 479.26, "r_y1": 227.34, "r_x2": 479.26, "r_y2": 219.32, "r_x3": 328.78, "r_y3": 219.32, "coord_origin": "TOPLEFT" }, "text": "Escalante, and Roberto Vezzani, editors,", "orig": "Escalante, and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.12, "r_y0": 227.13, "r_x1": 545.11, "r_y1": 227.13, "r_x2": 545.11, "r_y2": 219.4, "r_x3": 483.12, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 238.09, "r_x1": 519.4, "r_y1": 238.09, "r_x2": 519.4, "r_y2": 230.36, "r_x3": 328.78, "r_y3": 230.36, "coord_origin": "TOPLEFT" }, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 519.4, "r_y0": 238.3, "r_x1": 545.11, "r_y1": 238.3, "r_x2": 545.11, "r_y2": 230.28, "r_x3": 519.4, "r_y3": 230.28, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 249.26, "r_x1": 545.11, "r_y1": 249.26, "r_x2": 545.11, "r_y2": 241.24, "r_x3": 328.78, "r_y3": 241.24, "coord_origin": "TOPLEFT" }, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 260.21, "r_x1": 333.26, "r_y1": 260.21, "r_x2": 333.26, "r_y2": 252.2, "r_x3": 328.78, "r_y3": 252.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3" }, { "label": "list_item", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 308.86, "t": 263.64, "r": 545.11, "b": 326.45, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 271.66, "r_x1": 324.26, "r_y1": 271.66, "r_x2": 324.26, "r_y2": 263.64, "r_x3": 308.86, "r_y3": 263.64, "coord_origin": "TOPLEFT" }, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.58, "r_y0": 271.66, "r_x1": 545.11, "r_y1": 271.66, "r_x2": 545.11, "r_y2": 263.64, "r_x3": 326.58, "r_y3": 263.64, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 282.62, "r_x1": 545.11, "r_y1": 282.62, "r_x2": 545.11, "r_y2": 274.6, "r_x3": 328.78, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 293.58, "r_x1": 545.11, "r_y1": 293.58, "r_x2": 545.11, "r_y2": 285.56, "r_x3": 328.78, "r_y3": 285.56, "coord_origin": "TOPLEFT" }, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 304.54, "r_x1": 545.11, "r_y1": 304.54, "r_x2": 545.11, "r_y2": 296.52, "r_x3": 328.78, "r_y3": 296.52, "coord_origin": "TOPLEFT" }, "text": "bust pdf document conversion using recurrent neural net-", "orig": "bust pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 315.5, "r_x1": 352.85, "r_y1": 315.5, "r_x2": 352.85, "r_y2": 307.48, "r_x3": 328.78, "r_y3": 307.48, "coord_origin": "TOPLEFT" }, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.24, "r_y0": 315.29, "r_x1": 545.11, "r_y1": 315.29, "r_x2": 545.11, "r_y2": 307.56, "r_x3": 360.24, "r_y3": 307.56, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 326.25, "r_x1": 371.02, "r_y1": 326.25, "r_x2": 371.02, "r_y2": 318.52, "r_x3": 328.78, "r_y3": 318.52, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.02, "r_y0": 326.45, "r_x1": 502.26, "r_y1": 326.45, "r_x2": 502.26, "r_y2": 318.44, "r_x3": 371.02, "r_y3": 318.44, "coord_origin": "TOPLEFT" }, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1" }, { "label": "list_item", "id": 18, "page_no": 8, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 308.86, "t": 329.88, "r": 545.12, "b": 370.78, "coord_origin": "TOPLEFT" }, "confidence": 0.903, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 337.9, "r_x1": 323.83, "r_y1": 337.9, "r_x2": 323.83, "r_y2": 329.88, "r_x3": 308.86, "r_y3": 329.88, "coord_origin": "TOPLEFT" }, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.07, "r_y0": 337.9, "r_x1": 545.11, "r_y1": 337.9, "r_x2": 545.11, "r_y2": 329.88, "r_x3": 326.07, "r_y3": 329.88, "coord_origin": "TOPLEFT" }, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 348.86, "r_x1": 545.11, "r_y1": 348.86, "r_x2": 545.11, "r_y2": 340.84, "r_x3": 328.78, "r_y3": 340.84, "coord_origin": "TOPLEFT" }, "text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 359.82, "r_x1": 382.78, "r_y1": 359.82, "r_x2": 382.78, "r_y2": 351.8, "r_x3": 328.78, "r_y3": 351.8, "coord_origin": "TOPLEFT" }, "text": "in the wild. In", "orig": "in the wild. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.54, "r_y0": 359.61, "r_x1": 545.12, "r_y1": 359.61, "r_x2": 545.12, "r_y2": 351.88, "r_x3": 385.54, "r_y3": 351.88, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 370.57, "r_x1": 443.6, "r_y1": 370.57, "r_x2": 443.6, "r_y2": 362.84, "r_x3": 328.78, "r_y3": 362.84, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 443.59, "r_y0": 370.78, "r_x1": 534.49, "r_y1": 370.78, "r_x2": 534.49, "r_y2": 362.76, "r_x3": 443.59, "r_y3": 362.76, "coord_origin": "TOPLEFT" }, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2" }, { "label": "list_item", "id": 21, "page_no": 8, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 308.86, "t": 374.21, "r": 545.11, "b": 437.02, "coord_origin": "TOPLEFT" }, "confidence": 0.883, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 382.22, "r_x1": 324.6, "r_y1": 382.22, "r_x2": 324.6, "r_y2": 374.21, "r_x3": 308.86, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.96, "r_y0": 382.22, "r_x1": 362.66, "r_y1": 382.22, "r_x2": 362.66, "r_y2": 374.21, "r_x3": 326.96, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 368.69, "r_y0": 382.22, "r_x1": 389.61, "r_y1": 382.22, "r_x2": 389.61, "r_y2": 374.21, "r_x3": 368.69, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.65, "r_y0": 382.22, "r_x1": 424.56, "r_y1": 382.22, "r_x2": 424.56, "r_y2": 374.21, "r_x3": 395.65, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.55, "r_y0": 382.22, "r_x1": 438.02, "r_y1": 382.22, "r_x2": 438.02, "r_y2": 374.21, "r_x3": 431.55, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.06, "r_y0": 382.22, "r_x1": 488.5, "r_y1": 382.22, "r_x2": 488.5, "r_y2": 374.21, "r_x3": 444.06, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Vishwanath,", "orig": "Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.48, "r_y0": 382.22, "r_x1": 515.41, "r_y1": 382.22, "r_x2": 515.41, "r_y2": 374.21, "r_x3": 495.48, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 521.45, "r_y0": 382.22, "r_x1": 545.11, "r_y1": 382.22, "r_x2": 545.11, "r_y2": 374.21, "r_x3": 521.45, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 393.18, "r_x1": 545.11, "r_y1": 393.18, "r_x2": 545.11, "r_y2": 385.17, "r_x3": 328.78, "r_y3": 385.17, "coord_origin": "TOPLEFT" }, "text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 404.14, "r_x1": 545.11, "r_y1": 404.14, "r_x2": 545.11, "r_y2": 396.12, "r_x3": 328.78, "r_y3": 396.12, "coord_origin": "TOPLEFT" }, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 415.1, "r_x1": 478.01, "r_y1": 415.1, "r_x2": 478.01, "r_y2": 407.08, "r_x3": 328.78, "r_y3": 407.08, "coord_origin": "TOPLEFT" }, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 484.07, "r_y0": 415.1, "r_x1": 491.54, "r_y1": 415.1, "r_x2": 491.54, "r_y2": 407.08, "r_x3": 484.07, "r_y3": 407.08, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 494.67, "r_y0": 414.89, "r_x1": 545.11, "r_y1": 414.89, "r_x2": 545.11, "r_y2": 407.16, "r_x3": 494.67, "r_y3": 407.16, "coord_origin": "TOPLEFT" }, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 425.85, "r_x1": 545.11, "r_y1": 425.85, "r_x2": 545.11, "r_y2": 418.12, "r_x3": 328.78, "r_y3": 418.12, "coord_origin": "TOPLEFT" }, "text": "tional Conference on Document Analysis and Recognition", "orig": "tional Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 436.81, "r_x1": 360.84, "r_y1": 436.81, "r_x2": 360.84, "r_y2": 429.08, "r_x3": 328.78, "r_y3": 429.08, "coord_origin": "TOPLEFT" }, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.84, "r_y0": 437.02, "r_x1": 475.63, "r_y1": 437.02, "r_x2": 475.63, "r_y2": 429.0, "r_x3": 360.84, "r_y3": 429.0, "coord_origin": "TOPLEFT" }, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1" }, { "label": "list_item", "id": 20, "page_no": 8, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 308.86, "t": 440.45, "r": 545.11, "b": 558.05, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.46, "r_x1": 324.57, "r_y1": 448.46, "r_x2": 324.57, "r_y2": 440.45, "r_x3": 308.86, "r_y3": 440.45, "coord_origin": "TOPLEFT" }, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.93, "r_y0": 448.46, "r_x1": 545.11, "r_y1": 448.46, "r_x2": 545.11, "r_y2": 440.45, "r_x3": 326.93, "r_y3": 440.45, "coord_origin": "TOPLEFT" }, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 459.42, "r_x1": 545.11, "r_y1": 459.42, "r_x2": 545.11, "r_y2": 451.41, "r_x3": 328.78, "r_y3": 451.41, "coord_origin": "TOPLEFT" }, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 470.38, "r_x1": 545.11, "r_y1": 470.38, "r_x2": 545.11, "r_y2": 462.36, "r_x3": 328.78, "r_y3": 462.36, "coord_origin": "TOPLEFT" }, "text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 481.34, "r_x1": 545.11, "r_y1": 481.34, "r_x2": 545.11, "r_y2": 473.32, "r_x3": 328.78, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 492.3, "r_x1": 545.11, "r_y1": 492.3, "r_x2": 545.11, "r_y2": 484.28, "r_x3": 328.78, "r_y3": 484.28, "coord_origin": "TOPLEFT" }, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 503.26, "r_x1": 545.11, "r_y1": 503.26, "r_x2": 545.11, "r_y2": 495.24, "r_x3": 328.78, "r_y3": 495.24, "coord_origin": "TOPLEFT" }, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 514.22, "r_x1": 545.11, "r_y1": 514.22, "r_x2": 545.11, "r_y2": 506.2, "r_x3": 328.78, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 525.17, "r_x1": 545.11, "r_y1": 525.17, "r_x2": 545.11, "r_y2": 517.16, "r_x3": 328.78, "r_y3": 517.16, "coord_origin": "TOPLEFT" }, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 536.13, "r_x1": 434.57, "r_y1": 536.13, "r_x2": 434.57, "r_y2": 528.12, "r_x3": 328.78, "r_y3": 528.12, "coord_origin": "TOPLEFT" }, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.86, "r_y0": 535.93, "r_x1": 545.11, "r_y1": 535.93, "r_x2": 545.11, "r_y2": 528.2, "r_x3": 437.86, "r_y3": 528.2, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 546.89, "r_x1": 425.73, "r_y1": 546.89, "r_x2": 425.73, "r_y2": 539.16, "r_x3": 328.78, "r_y3": 539.16, "coord_origin": "TOPLEFT" }, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 425.74, "r_y0": 547.09, "r_x1": 545.11, "r_y1": 547.09, "r_x2": 545.11, "r_y2": 539.08, "r_x3": 425.74, "r_y3": 539.08, "coord_origin": "TOPLEFT" }, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 558.05, "r_x1": 399.74, "r_y1": 558.05, "r_x2": 399.74, "r_y2": 550.03, "r_x3": 328.78, "r_y3": 550.03, "coord_origin": "TOPLEFT" }, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E. Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6" }, { "label": "list_item", "id": 19, "page_no": 8, "cluster": { "id": 19, "label": "list_item", "bbox": { "l": 308.86, "t": 561.48, "r": 545.11, "b": 624.29, "coord_origin": "TOPLEFT" }, "confidence": 0.903, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.5, "r_x1": 324.5, "r_y1": 569.5, "r_x2": 324.5, "r_y2": 561.48, "r_x3": 308.86, "r_y3": 561.48, "coord_origin": "TOPLEFT" }, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.85, "r_y0": 569.5, "r_x1": 545.11, "r_y1": 569.5, "r_x2": 545.11, "r_y2": 561.48, "r_x3": 326.85, "r_y3": 561.48, "coord_origin": "TOPLEFT" }, "text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 580.46, "r_x1": 545.11, "r_y1": 580.46, "r_x2": 545.11, "r_y2": 572.44, "r_x3": 328.78, "r_y3": 572.44, "coord_origin": "TOPLEFT" }, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 591.41, "r_x1": 545.11, "r_y1": 591.41, "r_x2": 545.11, "r_y2": 583.4, "r_x3": 328.78, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 602.37, "r_x1": 431.62, "r_y1": 602.37, "r_x2": 431.62, "r_y2": 594.36, "r_x3": 328.78, "r_y3": 594.36, "coord_origin": "TOPLEFT" }, "text": "image-based documents. In", "orig": "image-based documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.69, "r_y0": 602.17, "r_x1": 545.11, "r_y1": 602.17, "r_x2": 545.11, "r_y2": 594.44, "r_x3": 434.69, "r_y3": 594.44, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 613.13, "r_x1": 545.11, "r_y1": 613.13, "r_x2": 545.11, "r_y2": 605.4, "r_x3": 328.78, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition", "orig": "Conference on Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 624.08, "r_x1": 367.8, "r_y1": 624.08, "r_x2": 367.8, "r_y2": 616.36, "r_x3": 328.78, "r_y3": 616.36, "coord_origin": "TOPLEFT" }, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.8, "r_y0": 624.29, "r_x1": 458.69, "r_y1": 624.29, "r_x2": 458.69, "r_y2": 616.28, "r_x3": 367.8, "r_y3": 616.28, "coord_origin": "TOPLEFT" }, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1" }, { "label": "list_item", "id": 23, "page_no": 8, "cluster": { "id": 23, "label": "list_item", "bbox": { "l": 308.86, "t": 627.72, "r": 545.12, "b": 668.61, "coord_origin": "TOPLEFT" }, "confidence": 0.878, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 635.74, "r_x1": 324.69, "r_y1": 635.74, "r_x2": 324.69, "r_y2": 627.72, "r_x3": 308.86, "r_y3": 627.72, "coord_origin": "TOPLEFT" }, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.07, "r_y0": 635.74, "r_x1": 545.11, "r_y1": 635.74, "r_x2": 545.11, "r_y2": 627.72, "r_x3": 327.07, "r_y3": 627.72, "coord_origin": "TOPLEFT" }, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 646.7, "r_x1": 545.11, "r_y1": 646.7, "r_x2": 545.11, "r_y2": 638.68, "r_x3": 328.78, "r_y3": 638.68, "coord_origin": "TOPLEFT" }, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 657.65, "r_x1": 336.25, "r_y1": 657.65, "r_x2": 336.25, "r_y2": 649.64, "r_x3": 328.78, "r_y3": 649.64, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.12, "r_y1": 657.45, "r_x2": 545.12, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 668.41, "r_x1": 406.32, "r_y1": 668.41, "r_x2": 406.32, "r_y2": 660.68, "r_x3": 328.78, "r_y3": 660.68, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32, "r_y0": 668.61, "r_x1": 521.12, "r_y1": 668.61, "r_x2": 521.12, "r_y2": 660.6, "r_x3": 406.32, "r_y3": 660.6, "coord_origin": "TOPLEFT" }, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3" }, { "label": "list_item", "id": 24, "page_no": 8, "cluster": { "id": 24, "label": "list_item", "bbox": { "l": 308.86, "t": 672.04, "r": 545.11, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.865, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 680.06, "r_x1": 324.71, "r_y1": 680.06, "r_x2": 324.71, "r_y2": 672.04, "r_x3": 308.86, "r_y3": 672.04, "coord_origin": "TOPLEFT" }, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.09, "r_y0": 680.06, "r_x1": 545.11, "r_y1": 680.06, "r_x2": 545.11, "r_y2": 672.04, "r_x3": 327.09, "r_y3": 672.04, "coord_origin": "TOPLEFT" }, "text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 691.02, "r_x1": 482.81, "r_y1": 691.02, "r_x2": 482.81, "r_y2": 683.0, "r_x3": 328.78, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.75, "r_y0": 691.02, "r_x1": 545.11, "r_y1": 691.02, "r_x2": 545.11, "r_y2": 683.0, "r_x3": 488.75, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 701.98, "r_x1": 545.11, "r_y1": 701.98, "r_x2": 545.11, "r_y2": 693.96, "r_x3": 328.78, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 712.94, "r_x1": 379.15, "r_y1": 712.94, "r_x2": 379.15, "r_y2": 704.92, "r_x3": 328.78, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "regression. In", "orig": "regression. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 381.62, "r_y0": 712.73, "r_x1": 545.11, "r_y1": 712.73, "r_x2": 545.11, "r_y2": 705.0, "r_x3": 381.62, "r_y3": 705.0, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on" }, { "label": "page_footer", "id": 22, "page_no": 8, "cluster": { "id": 22, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.88, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" } ], "body": [ { "label": "list_item", "id": 25, "page_no": 8, "cluster": { "id": 25, "label": "list_item", "bbox": { "l": 70.03, "t": 75.88, "r": 286.36, "b": 116.78, "coord_origin": "TOPLEFT" }, "confidence": 0.731, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 83.9, "r_x1": 286.36, "r_y1": 83.9, "r_x2": 286.36, "r_y2": 75.88, "r_x3": 70.03, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "end object detection with transformers. In Andrea Vedaldi,", "orig": "end object detection with transformers. In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 94.86, "r_x1": 286.36, "r_y1": 94.86, "r_x2": 286.36, "r_y2": 86.84, "r_x3": 70.03, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 105.82, "r_x1": 85.72, "r_y1": 105.82, "r_x2": 85.72, "r_y2": 97.8, "r_x3": 70.03, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 87.89, "r_y0": 105.61, "r_x1": 199.93, "r_y1": 105.61, "r_x2": 199.93, "r_y2": 97.88, "r_x3": 87.89, "r_y3": 97.88, "coord_origin": "TOPLEFT" }, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.94, "r_y0": 105.82, "r_x1": 286.36, "r_y1": 105.82, "r_x2": 286.36, "r_y2": 97.8, "r_x3": 199.94, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 116.78, "r_x1": 221.95, "r_y1": 116.78, "r_x2": 221.95, "r_y2": 108.76, "r_x3": 70.03, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5" }, { "label": "list_item", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 54.6, "t": 120.03, "r": 286.36, "b": 149.97, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 128.05, "r_x1": 65.21, "r_y1": 128.05, "r_x2": 65.21, "r_y2": 120.03, "r_x3": 54.6, "r_y3": 120.03, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.48, "r_y0": 128.05, "r_x1": 286.36, "r_y1": 128.05, "r_x2": 286.36, "r_y2": 120.03, "r_x3": 67.48, "r_y3": 120.03, "coord_origin": "TOPLEFT" }, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 139.01, "r_x1": 179.67, "r_y1": 139.01, "r_x2": 179.67, "r_y2": 130.99, "r_x3": 70.03, "r_y3": 130.99, "coord_origin": "TOPLEFT" }, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58, "r_y0": 139.01, "r_x1": 286.36, "r_y1": 139.01, "r_x2": 286.36, "r_y2": 130.99, "r_x3": 185.58, "r_y3": 130.99, "coord_origin": "TOPLEFT" }, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 149.97, "r_x1": 113.11, "r_y1": 149.97, "r_x2": 113.11, "r_y2": 141.95, "r_x3": 70.03, "r_y3": 141.95, "coord_origin": "TOPLEFT" }, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.34, "r_y0": 149.76, "r_x1": 235.31, "r_y1": 149.76, "r_x2": 235.31, "r_y2": 142.03, "r_x3": 116.34, "r_y3": 142.03, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.31, "r_y0": 149.97, "r_x1": 267.68, "r_y1": 149.97, "r_x2": 267.68, "r_y2": 141.95, "r_x3": 235.31, "r_y3": 141.95, "coord_origin": "TOPLEFT" }, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3" }, { "label": "list_item", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 54.6, "t": 153.22, "r": 286.36, "b": 183.15, "coord_origin": "TOPLEFT" }, "confidence": 0.938, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 161.24, "r_x1": 65.1, "r_y1": 161.24, "r_x2": 65.1, "r_y2": 153.22, "r_x3": 54.6, "r_y3": 153.22, "coord_origin": "TOPLEFT" }, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.36, "r_y0": 161.24, "r_x1": 218.78, "r_y1": 161.24, "r_x2": 218.78, "r_y2": 153.22, "r_x3": 67.36, "r_y3": 153.22, "coord_origin": "TOPLEFT" }, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.98, "r_y0": 161.03, "r_x1": 286.36, "r_y1": 161.03, "r_x2": 286.36, "r_y2": 153.3, "r_x3": 220.98, "r_y3": 153.3, "coord_origin": "TOPLEFT" }, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 171.99, "r_x1": 125.26, "r_y1": 171.99, "r_x2": 125.26, "r_y2": 164.26, "r_x3": 70.03, "r_y3": 164.26, "coord_origin": "TOPLEFT" }, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.26, "r_y0": 172.2, "r_x1": 286.36, "r_y1": 172.2, "r_x2": 286.36, "r_y2": 164.18, "r_x3": 125.26, "r_y3": 164.18, "coord_origin": "TOPLEFT" }, "text": ", pages 647-677. Springer London, London,", "orig": ", pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 183.15, "r_x1": 97.92, "r_y1": 183.15, "r_x2": 97.92, "r_y2": 175.14, "r_x3": 70.03, "r_y3": 175.14, "coord_origin": "TOPLEFT" }, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2" }, { "label": "list_item", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 54.59, "t": 186.41, "r": 286.36, "b": 227.3, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 194.43, "r_x1": 65.81, "r_y1": 194.43, "r_x2": 65.81, "r_y2": 186.41, "r_x3": 54.59, "r_y3": 186.41, "coord_origin": "TOPLEFT" }, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.21, "r_y0": 194.43, "r_x1": 286.36, "r_y1": 194.43, "r_x2": 286.36, "r_y2": 186.41, "r_x3": 68.21, "r_y3": 186.41, "coord_origin": "TOPLEFT" }, "text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 205.39, "r_x1": 286.36, "r_y1": 205.39, "r_x2": 286.36, "r_y2": 197.37, "r_x3": 70.03, "r_y3": 197.37, "coord_origin": "TOPLEFT" }, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 216.34, "r_x1": 286.36, "r_y1": 216.34, "r_x2": 286.36, "r_y2": 208.33, "r_x3": 70.03, "r_y3": 208.33, "coord_origin": "TOPLEFT" }, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 227.3, "r_x1": 245.84, "r_y1": 227.3, "r_x2": 245.84, "r_y2": 219.29, "r_x3": 70.03, "r_y3": 219.29, "coord_origin": "TOPLEFT" }, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[4] Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2" }, { "label": "list_item", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 54.59, "t": 230.56, "r": 286.36, "b": 271.45, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 238.58, "r_x1": 65.38, "r_y1": 238.58, "r_x2": 65.38, "r_y2": 230.56, "r_x3": 54.59, "r_y3": 230.56, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.69, "r_y0": 238.58, "r_x1": 286.36, "r_y1": 238.58, "r_x2": 286.36, "r_y2": 230.56, "r_x3": 67.69, "r_y3": 230.56, "coord_origin": "TOPLEFT" }, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 249.53, "r_x1": 286.36, "r_y1": 249.53, "r_x2": 286.36, "r_y2": 241.52, "r_x3": 70.03, "r_y3": 241.52, "coord_origin": "TOPLEFT" }, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 260.49, "r_x1": 108.4, "r_y1": 260.49, "r_x2": 108.4, "r_y2": 252.48, "r_x3": 70.03, "r_y3": 252.48, "coord_origin": "TOPLEFT" }, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.64, "r_y0": 260.29, "r_x1": 286.36, "r_y1": 260.29, "r_x2": 286.36, "r_y2": 252.56, "r_x3": 110.64, "r_y3": 252.56, "coord_origin": "TOPLEFT" }, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 271.25, "r_x1": 140.58, "r_y1": 271.25, "r_x2": 140.58, "r_y2": 263.52, "r_x3": 70.03, "r_y3": 263.52, "coord_origin": "TOPLEFT" }, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.58, "r_y0": 271.45, "r_x1": 266.48, "r_y1": 271.45, "r_x2": 266.48, "r_y2": 263.44, "r_x3": 140.58, "r_y3": 263.44, "coord_origin": "TOPLEFT" }, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2" }, { "label": "list_item", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 54.59, "t": 274.71, "r": 286.37, "b": 315.6, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 282.72, "r_x1": 64.85, "r_y1": 282.72, "r_x2": 64.85, "r_y2": 274.71, "r_x3": 54.59, "r_y3": 274.71, "coord_origin": "TOPLEFT" }, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.05, "r_y0": 282.72, "r_x1": 286.37, "r_y1": 282.72, "r_x2": 286.37, "r_y2": 274.71, "r_x3": 67.05, "r_y3": 274.71, "coord_origin": "TOPLEFT" }, "text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 293.68, "r_x1": 179.57, "r_y1": 293.68, "r_x2": 179.57, "r_y2": 285.67, "r_x3": 70.03, "r_y3": 285.67, "coord_origin": "TOPLEFT" }, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.02, "r_y0": 293.68, "r_x1": 194.48, "r_y1": 293.68, "r_x2": 194.48, "r_y2": 285.67, "r_x3": 187.02, "r_y3": 285.67, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.04, "r_y0": 293.48, "r_x1": 286.36, "r_y1": 293.48, "r_x2": 286.36, "r_y2": 285.75, "r_x3": 198.04, "r_y3": 285.75, "coord_origin": "TOPLEFT" }, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 304.44, "r_x1": 260.2, "r_y1": 304.44, "r_x2": 260.2, "r_y2": 296.71, "r_x3": 70.03, "r_y3": 296.71, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 260.2, "r_y0": 304.64, "r_x1": 286.36, "r_y1": 304.64, "r_x2": 286.36, "r_y2": 296.63, "r_x3": 260.2, "r_y3": 296.63, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 315.6, "r_x1": 142.75, "r_y1": 315.6, "r_x2": 142.75, "r_y2": 307.58, "r_x3": 70.03, "r_y3": 307.58, "coord_origin": "TOPLEFT" }, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[6] Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2" }, { "label": "list_item", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 54.59, "t": 318.86, "r": 286.36, "b": 348.79, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 326.87, "r_x1": 65.62, "r_y1": 326.87, "r_x2": 65.62, "r_y2": 318.86, "r_x3": 54.59, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.98, "r_y0": 326.87, "r_x1": 199.49, "r_y1": 326.87, "r_x2": 199.49, "r_y2": 318.86, "r_x3": 67.98, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.99, "r_y0": 326.87, "r_x1": 286.36, "r_y1": 326.87, "r_x2": 286.36, "r_y2": 318.86, "r_x3": 206.99, "r_y3": 318.86, "coord_origin": "TOPLEFT" }, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 337.83, "r_x1": 176.28, "r_y1": 337.83, "r_x2": 176.28, "r_y2": 329.81, "r_x3": 70.03, "r_y3": 329.81, "coord_origin": "TOPLEFT" }, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.6, "r_y0": 337.83, "r_x1": 190.07, "r_y1": 337.83, "r_x2": 190.07, "r_y2": 329.81, "r_x3": 182.6, "r_y3": 329.81, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.28, "r_y0": 337.62, "r_x1": 286.36, "r_y1": 337.62, "r_x2": 286.36, "r_y2": 329.9, "r_x3": 193.28, "r_y3": 329.9, "coord_origin": "TOPLEFT" }, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 348.58, "r_x1": 206.35, "r_y1": 348.58, "r_x2": 206.35, "r_y2": 340.85, "r_x3": 70.03, "r_y3": 340.85, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (SDAIR\u201995)", "orig": "Analysis and Recognition (SDAIR\u201995)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.35, "r_y0": 348.79, "r_x1": 274.82, "r_y1": 348.79, "r_x2": 274.82, "r_y2": 340.77, "r_x3": 206.35, "r_y3": 340.77, "coord_origin": "TOPLEFT" }, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2" }, { "label": "list_item", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 54.59, "t": 352.05, "r": 286.36, "b": 403.9, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.59, "r_y0": 360.06, "r_x1": 65.05, "r_y1": 360.06, "r_x2": 65.05, "r_y2": 352.05, "r_x3": 54.59, "r_y3": 352.05, "coord_origin": "TOPLEFT" }, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.29, "r_y0": 360.06, "r_x1": 286.36, "r_y1": 360.06, "r_x2": 286.36, "r_y2": 352.05, "r_x3": 67.29, "r_y3": 352.05, "coord_origin": "TOPLEFT" }, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 371.02, "r_x1": 234.13, "r_y1": 371.02, "r_x2": 234.13, "r_y2": 363.0, "r_x3": 70.03, "r_y3": 363.0, "coord_origin": "TOPLEFT" }, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.05, "r_y0": 371.02, "r_x1": 286.36, "r_y1": 371.02, "r_x2": 286.36, "r_y2": 363.0, "r_x3": 240.05, "r_y3": 363.0, "coord_origin": "TOPLEFT" }, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 381.98, "r_x1": 286.36, "r_y1": 381.98, "r_x2": 286.36, "r_y2": 373.96, "r_x3": 70.03, "r_y3": 373.96, "coord_origin": "TOPLEFT" }, "text": "tors: Cascade network for table detection in document im-", "orig": "tors: Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 392.94, "r_x1": 286.36, "r_y1": 392.94, "r_x2": 286.36, "r_y2": 384.92, "r_x3": 70.03, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 403.9, "r_x1": 114.58, "r_y1": 403.9, "r_x2": 114.58, "r_y2": 395.88, "r_x3": 70.03, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 117.8, "r_y0": 403.69, "r_x1": 186.73, "r_y1": 403.69, "r_x2": 186.73, "r_y2": 395.96, "r_x3": 117.8, "r_y3": 395.96, "coord_origin": "TOPLEFT" }, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.73, "r_y0": 403.9, "r_x1": 243.0, "r_y1": 403.9, "r_x2": 243.0, "r_y2": 395.88, "r_x3": 186.73, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1" }, { "label": "list_item", "id": 10, "page_no": 8, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 54.6, "t": 407.15, "r": 286.36, "b": 437.09, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.6, "r_y0": 415.17, "r_x1": 65.33, "r_y1": 415.17, "r_x2": 65.33, "r_y2": 407.15, "r_x3": 54.6, "r_y3": 407.15, "coord_origin": "TOPLEFT" }, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.64, "r_y0": 415.17, "r_x1": 286.36, "r_y1": 415.17, "r_x2": 286.36, "r_y2": 407.15, "r_x3": 67.64, "r_y3": 407.15, "coord_origin": "TOPLEFT" }, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 426.13, "r_x1": 147.13, "r_y1": 426.13, "r_x2": 147.13, "r_y2": 418.11, "r_x3": 70.03, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.16, "r_y0": 425.92, "r_x1": 286.36, "r_y1": 425.92, "r_x2": 286.36, "r_y2": 418.19, "r_x3": 149.16, "r_y3": 418.19, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 436.88, "r_x1": 213.48, "r_y1": 436.88, "r_x2": 213.48, "r_y2": 429.15, "r_x3": 70.03, "r_y3": 429.15, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 213.48, "r_y0": 437.09, "r_x1": 261.04, "r_y1": 437.09, "r_x2": 261.04, "r_y2": 429.07, "r_x3": 213.48, "r_y3": 429.07, "coord_origin": "TOPLEFT" }, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1" }, { "label": "list_item", "id": 14, "page_no": 8, "cluster": { "id": 14, "label": "list_item", "bbox": { "l": 50.11, "t": 440.34, "r": 286.36, "b": 481.24, "coord_origin": "TOPLEFT" }, "confidence": 0.927, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 448.36, "r_x1": 65.4, "r_y1": 448.36, "r_x2": 65.4, "r_y2": 440.34, "r_x3": 50.11, "r_y3": 440.34, "coord_origin": "TOPLEFT" }, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.69, "r_y0": 448.36, "r_x1": 286.36, "r_y1": 448.36, "r_x2": 286.36, "r_y2": 440.34, "r_x3": 67.69, "r_y3": 440.34, "coord_origin": "TOPLEFT" }, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 459.32, "r_x1": 202.74, "r_y1": 459.32, "r_x2": 202.74, "r_y2": 451.3, "r_x3": 70.03, "r_y3": 451.3, "coord_origin": "TOPLEFT" }, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.0, "r_y0": 459.32, "r_x1": 286.36, "r_y1": 459.32, "r_x2": 286.36, "r_y2": 451.3, "r_x3": 209.0, "r_y3": 451.3, "coord_origin": "TOPLEFT" }, "text": "Pingan-vcgroup\u2019s so-", "orig": "Pingan-vcgroup\u2019s so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 470.28, "r_x1": 286.36, "r_y1": 470.28, "r_x2": 286.36, "r_y2": 462.26, "r_x3": 70.03, "r_y3": 462.26, "coord_origin": "TOPLEFT" }, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 481.24, "r_x1": 141.87, "r_y1": 481.24, "r_x2": 141.87, "r_y2": 473.22, "r_x3": 70.03, "r_y3": 473.22, "coord_origin": "TOPLEFT" }, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.1, "r_y0": 481.03, "r_x1": 166.02, "r_y1": 481.03, "r_x2": 166.02, "r_y2": 473.3, "r_x3": 145.1, "r_y3": 473.3, "coord_origin": "TOPLEFT" }, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.01, "r_y0": 481.24, "r_x1": 259.9, "r_y1": 481.24, "r_x2": 259.9, "r_y2": 473.22, "r_x3": 166.01, "r_y3": 473.22, "coord_origin": "TOPLEFT" }, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2" }, { "label": "list_item", "id": 11, "page_no": 8, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 50.11, "t": 484.49, "r": 286.36, "b": 536.34, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 492.51, "r_x1": 66.03, "r_y1": 492.51, "r_x2": 66.03, "r_y2": 484.49, "r_x3": 50.11, "r_y3": 484.49, "coord_origin": "TOPLEFT" }, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.42, "r_y0": 492.51, "r_x1": 286.36, "r_y1": 492.51, "r_x2": 286.36, "r_y2": 484.49, "r_x3": 68.42, "r_y3": 484.49, "coord_origin": "TOPLEFT" }, "text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 503.47, "r_x1": 286.36, "r_y1": 503.47, "r_x2": 286.36, "r_y2": 495.45, "r_x3": 70.03, "r_y3": 495.45, "coord_origin": "TOPLEFT" }, "text": "Gordon Wilfong. Medium-independent table detection. In", "orig": "Gordon Wilfong. Medium-independent table detection. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 514.22, "r_x1": 227.41, "r_y1": 514.22, "r_x2": 227.41, "r_y2": 506.49, "r_x3": 70.03, "r_y3": 506.49, "coord_origin": "TOPLEFT" }, "text": "Document Recognition and Retrieval VII", "orig": "Document Recognition and Retrieval VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.41, "r_y0": 514.42, "r_x1": 286.36, "r_y1": 514.42, "r_x2": 286.36, "r_y2": 506.41, "r_x3": 227.41, "r_y3": 506.41, "coord_origin": "TOPLEFT" }, "text": ", volume 3967,", "orig": ", volume 3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 525.38, "r_x1": 286.36, "r_y1": 525.38, "r_x2": 286.36, "r_y2": 517.37, "r_x3": 70.03, "r_y3": 517.37, "coord_origin": "TOPLEFT" }, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 536.34, "r_x1": 112.36, "r_y1": 536.34, "r_x2": 112.36, "r_y2": 528.33, "r_x3": 70.03, "r_y3": 528.33, "coord_origin": "TOPLEFT" }, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2" }, { "label": "list_item", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 539.6, "r": 286.36, "b": 591.45, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 547.61, "r_x1": 65.47, "r_y1": 547.61, "r_x2": 65.47, "r_y2": 539.6, "r_x3": 50.11, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 547.61, "r_x1": 286.36, "r_y1": 547.61, "r_x2": 286.36, "r_y2": 539.6, "r_x3": 67.77, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "Matthew Hurst. A constraint-based approach to table struc-", "orig": "Matthew Hurst. A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 558.57, "r_x1": 136.28, "r_y1": 558.57, "r_x2": 136.28, "r_y2": 550.56, "r_x3": 70.03, "r_y3": 550.56, "coord_origin": "TOPLEFT" }, "text": "ture derivation. In", "orig": "ture derivation. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.81, "r_y0": 558.37, "r_x1": 286.36, "r_y1": 558.37, "r_x2": 286.36, "r_y2": 550.64, "r_x3": 138.81, "r_y3": 550.64, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 569.33, "r_x1": 286.36, "r_y1": 569.33, "r_x2": 286.36, "r_y2": 561.6, "r_x3": 70.03, "r_y3": 561.6, "coord_origin": "TOPLEFT" }, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 580.29, "r_x1": 74.51, "r_y1": 580.29, "r_x2": 74.51, "r_y2": 572.56, "r_x3": 70.03, "r_y3": 572.56, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 74.51, "r_y0": 580.49, "r_x1": 286.36, "r_y1": 580.49, "r_x2": 286.36, "r_y2": 572.48, "r_x3": 74.51, "r_y3": 572.48, "coord_origin": "TOPLEFT" }, "text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 591.45, "r_x1": 90.36, "r_y1": 591.45, "r_x2": 90.36, "r_y2": 583.43, "r_x3": 70.03, "r_y3": 583.43, "coord_origin": "TOPLEFT" }, "text": "ety. 2", "orig": "ety. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2" }, { "label": "list_item", "id": 13, "page_no": 8, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 594.71, "r": 286.36, "b": 646.56, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 602.72, "r_x1": 66.27, "r_y1": 602.72, "r_x2": 66.27, "r_y2": 594.71, "r_x3": 50.11, "r_y3": 594.71, "coord_origin": "TOPLEFT" }, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.7, "r_y0": 602.72, "r_x1": 286.36, "r_y1": 602.72, "r_x2": 286.36, "r_y2": 594.71, "r_x3": 68.7, "r_y3": 594.71, "coord_origin": "TOPLEFT" }, "text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 613.68, "r_x1": 286.36, "r_y1": 613.68, "r_x2": 286.36, "r_y2": 605.66, "r_x3": 70.03, "r_y3": 605.66, "coord_origin": "TOPLEFT" }, "text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 624.64, "r_x1": 286.36, "r_y1": 624.64, "r_x2": 286.36, "r_y2": 616.62, "r_x3": 70.03, "r_y3": 616.62, "coord_origin": "TOPLEFT" }, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 635.6, "r_x1": 77.5, "r_y1": 635.6, "r_x2": 77.5, "r_y2": 627.58, "r_x3": 70.03, "r_y3": 627.58, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.92, "r_y0": 635.39, "r_x1": 286.36, "r_y1": 635.39, "r_x2": 286.36, "r_y2": 627.66, "r_x3": 79.92, "r_y3": 627.66, "coord_origin": "TOPLEFT" }, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 646.35, "r_x1": 140.68, "r_y1": 646.35, "r_x2": 140.68, "r_y2": 638.62, "r_x3": 70.03, "r_y3": 638.62, "coord_origin": "TOPLEFT" }, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.68, "r_y0": 646.56, "r_x1": 264.44, "r_y1": 646.56, "r_x2": 264.44, "r_y2": 638.54, "r_x3": 140.68, "r_y3": 638.54, "coord_origin": "TOPLEFT" }, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2" }, { "label": "list_item", "id": 17, "page_no": 8, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 50.11, "t": 649.81, "r": 286.36, "b": 679.75, "coord_origin": "TOPLEFT" }, "confidence": 0.912, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 657.83, "r_x1": 66.53, "r_y1": 657.83, "r_x2": 66.53, "r_y2": 649.81, "r_x3": 50.11, "r_y3": 649.81, "coord_origin": "TOPLEFT" }, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 69.0, "r_y0": 657.83, "r_x1": 286.36, "r_y1": 657.83, "r_x2": 286.36, "r_y2": 649.81, "r_x3": 69.0, "r_y3": 649.81, "coord_origin": "TOPLEFT" }, "text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 668.79, "r_x1": 93.2, "r_y1": 668.79, "r_x2": 93.2, "r_y2": 660.77, "r_x3": 70.03, "r_y3": 660.77, "coord_origin": "TOPLEFT" }, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 102.2, "r_y0": 668.79, "r_x1": 286.36, "r_y1": 668.79, "r_x2": 286.36, "r_y2": 660.77, "r_x3": 102.2, "r_y3": 660.77, "coord_origin": "TOPLEFT" }, "text": "Icdar 2021 competition on scientific table image", "orig": "Icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 679.75, "r_x1": 172.0, "r_y1": 679.75, "r_x2": 172.0, "r_y2": 671.73, "r_x3": 70.03, "r_y3": 671.73, "coord_origin": "TOPLEFT" }, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2" }, { "label": "list_item", "id": 16, "page_no": 8, "cluster": { "id": 16, "label": "list_item", "bbox": { "l": 50.11, "t": 683.0, "r": 286.36, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.912, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 691.02, "r_x1": 65.52, "r_y1": 691.02, "r_x2": 65.52, "r_y2": 683.0, "r_x3": 50.11, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.83, "r_y0": 691.02, "r_x1": 286.36, "r_y1": 691.02, "r_x2": 286.36, "r_y2": 683.0, "r_x3": 67.83, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Harold W Kuhn. The hungarian method for the assignment", "orig": "Harold W Kuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 701.98, "r_x1": 102.16, "r_y1": 701.98, "r_x2": 102.16, "r_y2": 693.96, "r_x3": 70.03, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 107.55, "r_y0": 701.77, "r_x1": 231.47, "r_y1": 701.77, "r_x2": 231.47, "r_y2": 694.04, "r_x3": 107.55, "r_y3": 694.04, "coord_origin": "TOPLEFT" }, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 231.48, "r_y0": 701.98, "r_x1": 286.36, "r_y1": 701.98, "r_x2": 286.36, "r_y2": 693.96, "r_x3": 231.48, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": ", 2(1-2):83-97,", "orig": ", 2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 712.94, "r_x1": 97.92, "r_y1": 712.94, "r_x2": 97.92, "r_y2": 704.92, "r_x3": 70.03, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[15] Harold W Kuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6" }, { "label": "list_item", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 75.88, "r": 545.11, "b": 138.69, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 83.9, "r_x1": 324.75, "r_y1": 83.9, "r_x2": 324.75, "r_y2": 75.88, "r_x3": 308.86, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.13, "r_y0": 83.9, "r_x1": 545.11, "r_y1": 83.9, "r_x2": 545.11, "r_y2": 75.88, "r_x3": 327.13, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 94.86, "r_x1": 545.11, "r_y1": 94.86, "r_x2": 545.11, "r_y2": 86.84, "r_x3": 328.78, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 105.82, "r_x1": 390.96, "r_y1": 105.82, "r_x2": 390.96, "r_y2": 97.8, "r_x3": 328.78, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.27, "r_y0": 105.82, "r_x1": 435.14, "r_y1": 105.82, "r_x2": 435.14, "r_y2": 97.8, "r_x3": 400.27, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.71, "r_y0": 105.82, "r_x1": 545.11, "r_y1": 105.82, "r_x2": 545.11, "r_y2": 97.8, "r_x3": 441.71, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": "Understanding and generat-", "orig": "Understanding and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 116.78, "r_x1": 440.81, "r_y1": 116.78, "r_x2": 440.81, "r_y2": 108.76, "r_x3": 328.78, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.63, "r_y0": 116.57, "r_x1": 545.11, "r_y1": 116.57, "r_x2": 545.11, "r_y2": 108.84, "r_x3": 446.63, "r_y3": 108.84, "coord_origin": "TOPLEFT" }, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 127.53, "r_x1": 471.13, "r_y1": 127.53, "r_x2": 471.13, "r_y2": 119.8, "r_x3": 328.78, "r_y3": 119.8, "coord_origin": "TOPLEFT" }, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.13, "r_y0": 127.73, "r_x1": 545.11, "r_y1": 127.73, "r_x2": 545.11, "r_y2": 119.72, "r_x3": 471.13, "r_y3": 119.72, "coord_origin": "TOPLEFT" }, "text": ", 35(12):2891-2903,", "orig": ", 35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 138.69, "r_x1": 356.67, "r_y1": 138.69, "r_x2": 356.67, "r_y2": 130.68, "r_x3": 328.78, "r_y3": 130.68, "coord_origin": "TOPLEFT" }, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4" }, { "label": "list_item", "id": 15, "page_no": 8, "cluster": { "id": 15, "label": "list_item", "bbox": { "l": 308.86, "t": 142.12, "r": 545.11, "b": 172.06, "coord_origin": "TOPLEFT" }, "confidence": 0.925, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 150.14, "r_x1": 325.24, "r_y1": 150.14, "r_x2": 325.24, "r_y2": 142.12, "r_x3": 308.86, "r_y3": 142.12, "coord_origin": "TOPLEFT" }, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.7, "r_y0": 150.14, "r_x1": 545.11, "r_y1": 150.14, "r_x2": 545.11, "r_y2": 142.12, "r_x3": 327.7, "r_y3": 142.12, "coord_origin": "TOPLEFT" }, "text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 161.1, "r_x1": 414.45, "r_y1": 161.1, "r_x2": 414.45, "r_y2": 153.08, "r_x3": 328.78, "r_y3": 153.08, "coord_origin": "TOPLEFT" }, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 421.83, "r_y0": 161.1, "r_x1": 545.11, "r_y1": 161.1, "r_x2": 545.11, "r_y2": 153.08, "r_x3": 421.83, "r_y3": 153.08, "coord_origin": "TOPLEFT" }, "text": "Tablebank: A benchmark dataset", "orig": "Tablebank: A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 172.06, "r_x1": 493.63, "r_y1": 172.06, "r_x2": 493.63, "r_y2": 164.04, "r_x3": 328.78, "r_y3": 164.04, "coord_origin": "TOPLEFT" }, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3" }, { "label": "list_item", "id": 12, "page_no": 8, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 308.86, "t": 175.49, "r": 545.11, "b": 260.21, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 183.5, "r_x1": 324.27, "r_y1": 183.5, "r_x2": 324.27, "r_y2": 175.49, "r_x3": 308.86, "r_y3": 175.49, "coord_origin": "TOPLEFT" }, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.58, "r_y0": 183.5, "r_x1": 545.11, "r_y1": 183.5, "r_x2": 545.11, "r_y2": 175.49, "r_x3": 326.58, "r_y3": 175.49, "coord_origin": "TOPLEFT" }, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 194.46, "r_x1": 545.11, "r_y1": 194.46, "r_x2": 545.11, "r_y2": 186.45, "r_x3": 328.78, "r_y3": 186.45, "coord_origin": "TOPLEFT" }, "text": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 205.42, "r_x1": 545.11, "r_y1": 205.42, "r_x2": 545.11, "r_y2": 197.4, "r_x3": 328.78, "r_y3": 197.4, "coord_origin": "TOPLEFT" }, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 216.38, "r_x1": 545.11, "r_y1": 216.38, "r_x2": 545.11, "r_y2": 208.36, "r_x3": 328.78, "r_y3": 208.36, "coord_origin": "TOPLEFT" }, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 227.34, "r_x1": 479.26, "r_y1": 227.34, "r_x2": 479.26, "r_y2": 219.32, "r_x3": 328.78, "r_y3": 219.32, "coord_origin": "TOPLEFT" }, "text": "Escalante, and Roberto Vezzani, editors,", "orig": "Escalante, and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.12, "r_y0": 227.13, "r_x1": 545.11, "r_y1": 227.13, "r_x2": 545.11, "r_y2": 219.4, "r_x3": 483.12, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 238.09, "r_x1": 519.4, "r_y1": 238.09, "r_x2": 519.4, "r_y2": 230.36, "r_x3": 328.78, "r_y3": 230.36, "coord_origin": "TOPLEFT" }, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 519.4, "r_y0": 238.3, "r_x1": 545.11, "r_y1": 238.3, "r_x2": 545.11, "r_y2": 230.28, "r_x3": 519.4, "r_y3": 230.28, "coord_origin": "TOPLEFT" }, "text": ", pages", "orig": ", pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 249.26, "r_x1": 545.11, "r_y1": 249.26, "r_x2": 545.11, "r_y2": 241.24, "r_x3": 328.78, "r_y3": 241.24, "coord_origin": "TOPLEFT" }, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 260.21, "r_x1": 333.26, "r_y1": 260.21, "r_x2": 333.26, "r_y2": 252.2, "r_x3": 328.78, "r_y3": 252.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3" }, { "label": "list_item", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 308.86, "t": 263.64, "r": 545.11, "b": 326.45, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 271.66, "r_x1": 324.26, "r_y1": 271.66, "r_x2": 324.26, "r_y2": 263.64, "r_x3": 308.86, "r_y3": 263.64, "coord_origin": "TOPLEFT" }, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.58, "r_y0": 271.66, "r_x1": 545.11, "r_y1": 271.66, "r_x2": 545.11, "r_y2": 263.64, "r_x3": 326.58, "r_y3": 263.64, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 282.62, "r_x1": 545.11, "r_y1": 282.62, "r_x2": 545.11, "r_y2": 274.6, "r_x3": 328.78, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 293.58, "r_x1": 545.11, "r_y1": 293.58, "r_x2": 545.11, "r_y2": 285.56, "r_x3": 328.78, "r_y3": 285.56, "coord_origin": "TOPLEFT" }, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 304.54, "r_x1": 545.11, "r_y1": 304.54, "r_x2": 545.11, "r_y2": 296.52, "r_x3": 328.78, "r_y3": 296.52, "coord_origin": "TOPLEFT" }, "text": "bust pdf document conversion using recurrent neural net-", "orig": "bust pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 315.5, "r_x1": 352.85, "r_y1": 315.5, "r_x2": 352.85, "r_y2": 307.48, "r_x3": 328.78, "r_y3": 307.48, "coord_origin": "TOPLEFT" }, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.24, "r_y0": 315.29, "r_x1": 545.11, "r_y1": 315.29, "r_x2": 545.11, "r_y2": 307.56, "r_x3": 360.24, "r_y3": 307.56, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 326.25, "r_x1": 371.02, "r_y1": 326.25, "r_x2": 371.02, "r_y2": 318.52, "r_x3": 328.78, "r_y3": 318.52, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.02, "r_y0": 326.45, "r_x1": 502.26, "r_y1": 326.45, "r_x2": 502.26, "r_y2": 318.44, "r_x3": 371.02, "r_y3": 318.44, "coord_origin": "TOPLEFT" }, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1" }, { "label": "list_item", "id": 18, "page_no": 8, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 308.86, "t": 329.88, "r": 545.12, "b": 370.78, "coord_origin": "TOPLEFT" }, "confidence": 0.903, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 337.9, "r_x1": 323.83, "r_y1": 337.9, "r_x2": 323.83, "r_y2": 329.88, "r_x3": 308.86, "r_y3": 329.88, "coord_origin": "TOPLEFT" }, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.07, "r_y0": 337.9, "r_x1": 545.11, "r_y1": 337.9, "r_x2": 545.11, "r_y2": 329.88, "r_x3": 326.07, "r_y3": 329.88, "coord_origin": "TOPLEFT" }, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 348.86, "r_x1": 545.11, "r_y1": 348.86, "r_x2": 545.11, "r_y2": 340.84, "r_x3": 328.78, "r_y3": 340.84, "coord_origin": "TOPLEFT" }, "text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 359.82, "r_x1": 382.78, "r_y1": 359.82, "r_x2": 382.78, "r_y2": 351.8, "r_x3": 328.78, "r_y3": 351.8, "coord_origin": "TOPLEFT" }, "text": "in the wild. In", "orig": "in the wild. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 385.54, "r_y0": 359.61, "r_x1": 545.12, "r_y1": 359.61, "r_x2": 545.12, "r_y2": 351.88, "r_x3": 385.54, "r_y3": 351.88, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 370.57, "r_x1": 443.6, "r_y1": 370.57, "r_x2": 443.6, "r_y2": 362.84, "r_x3": 328.78, "r_y3": 362.84, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 443.59, "r_y0": 370.78, "r_x1": 534.49, "r_y1": 370.78, "r_x2": 534.49, "r_y2": 362.76, "r_x3": 443.59, "r_y3": 362.76, "coord_origin": "TOPLEFT" }, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2" }, { "label": "list_item", "id": 21, "page_no": 8, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 308.86, "t": 374.21, "r": 545.11, "b": 437.02, "coord_origin": "TOPLEFT" }, "confidence": 0.883, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 382.22, "r_x1": 324.6, "r_y1": 382.22, "r_x2": 324.6, "r_y2": 374.21, "r_x3": 308.86, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.96, "r_y0": 382.22, "r_x1": 362.66, "r_y1": 382.22, "r_x2": 362.66, "r_y2": 374.21, "r_x3": 326.96, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 368.69, "r_y0": 382.22, "r_x1": 389.61, "r_y1": 382.22, "r_x2": 389.61, "r_y2": 374.21, "r_x3": 368.69, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.65, "r_y0": 382.22, "r_x1": 424.56, "r_y1": 382.22, "r_x2": 424.56, "r_y2": 374.21, "r_x3": 395.65, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 431.55, "r_y0": 382.22, "r_x1": 438.02, "r_y1": 382.22, "r_x2": 438.02, "r_y2": 374.21, "r_x3": 431.55, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.06, "r_y0": 382.22, "r_x1": 488.5, "r_y1": 382.22, "r_x2": 488.5, "r_y2": 374.21, "r_x3": 444.06, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Vishwanath,", "orig": "Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 495.48, "r_y0": 382.22, "r_x1": 515.41, "r_y1": 382.22, "r_x2": 515.41, "r_y2": 374.21, "r_x3": 495.48, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 521.45, "r_y0": 382.22, "r_x1": 545.11, "r_y1": 382.22, "r_x2": 545.11, "r_y2": 374.21, "r_x3": 521.45, "r_y3": 374.21, "coord_origin": "TOPLEFT" }, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 393.18, "r_x1": 545.11, "r_y1": 393.18, "r_x2": 545.11, "r_y2": 385.17, "r_x3": 328.78, "r_y3": 385.17, "coord_origin": "TOPLEFT" }, "text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 404.14, "r_x1": 545.11, "r_y1": 404.14, "r_x2": 545.11, "r_y2": 396.12, "r_x3": 328.78, "r_y3": 396.12, "coord_origin": "TOPLEFT" }, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 415.1, "r_x1": 478.01, "r_y1": 415.1, "r_x2": 478.01, "r_y2": 407.08, "r_x3": 328.78, "r_y3": 407.08, "coord_origin": "TOPLEFT" }, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 484.07, "r_y0": 415.1, "r_x1": 491.54, "r_y1": 415.1, "r_x2": 491.54, "r_y2": 407.08, "r_x3": 484.07, "r_y3": 407.08, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 494.67, "r_y0": 414.89, "r_x1": 545.11, "r_y1": 414.89, "r_x2": 545.11, "r_y2": 407.16, "r_x3": 494.67, "r_y3": 407.16, "coord_origin": "TOPLEFT" }, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 425.85, "r_x1": 545.11, "r_y1": 425.85, "r_x2": 545.11, "r_y2": 418.12, "r_x3": 328.78, "r_y3": 418.12, "coord_origin": "TOPLEFT" }, "text": "tional Conference on Document Analysis and Recognition", "orig": "tional Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 436.81, "r_x1": 360.84, "r_y1": 436.81, "r_x2": 360.84, "r_y2": 429.08, "r_x3": 328.78, "r_y3": 429.08, "coord_origin": "TOPLEFT" }, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.84, "r_y0": 437.02, "r_x1": 475.63, "r_y1": 437.02, "r_x2": 475.63, "r_y2": 429.0, "r_x3": 360.84, "r_y3": 429.0, "coord_origin": "TOPLEFT" }, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1" }, { "label": "list_item", "id": 20, "page_no": 8, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 308.86, "t": 440.45, "r": 545.11, "b": 558.05, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.46, "r_x1": 324.57, "r_y1": 448.46, "r_x2": 324.57, "r_y2": 440.45, "r_x3": 308.86, "r_y3": 440.45, "coord_origin": "TOPLEFT" }, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.93, "r_y0": 448.46, "r_x1": 545.11, "r_y1": 448.46, "r_x2": 545.11, "r_y2": 440.45, "r_x3": 326.93, "r_y3": 440.45, "coord_origin": "TOPLEFT" }, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 459.42, "r_x1": 545.11, "r_y1": 459.42, "r_x2": 545.11, "r_y2": 451.41, "r_x3": 328.78, "r_y3": 451.41, "coord_origin": "TOPLEFT" }, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 470.38, "r_x1": 545.11, "r_y1": 470.38, "r_x2": 545.11, "r_y2": 462.36, "r_x3": 328.78, "r_y3": 462.36, "coord_origin": "TOPLEFT" }, "text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 481.34, "r_x1": 545.11, "r_y1": 481.34, "r_x2": 545.11, "r_y2": 473.32, "r_x3": 328.78, "r_y3": 473.32, "coord_origin": "TOPLEFT" }, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 492.3, "r_x1": 545.11, "r_y1": 492.3, "r_x2": 545.11, "r_y2": 484.28, "r_x3": 328.78, "r_y3": 484.28, "coord_origin": "TOPLEFT" }, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 503.26, "r_x1": 545.11, "r_y1": 503.26, "r_x2": 545.11, "r_y2": 495.24, "r_x3": 328.78, "r_y3": 495.24, "coord_origin": "TOPLEFT" }, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 514.22, "r_x1": 545.11, "r_y1": 514.22, "r_x2": 545.11, "r_y2": 506.2, "r_x3": 328.78, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 525.17, "r_x1": 545.11, "r_y1": 525.17, "r_x2": 545.11, "r_y2": 517.16, "r_x3": 328.78, "r_y3": 517.16, "coord_origin": "TOPLEFT" }, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 536.13, "r_x1": 434.57, "r_y1": 536.13, "r_x2": 434.57, "r_y2": 528.12, "r_x3": 328.78, "r_y3": 528.12, "coord_origin": "TOPLEFT" }, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.86, "r_y0": 535.93, "r_x1": 545.11, "r_y1": 535.93, "r_x2": 545.11, "r_y2": 528.2, "r_x3": 437.86, "r_y3": 528.2, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 546.89, "r_x1": 425.73, "r_y1": 546.89, "r_x2": 425.73, "r_y2": 539.16, "r_x3": 328.78, "r_y3": 539.16, "coord_origin": "TOPLEFT" }, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 425.74, "r_y0": 547.09, "r_x1": 545.11, "r_y1": 547.09, "r_x2": 545.11, "r_y2": 539.08, "r_x3": 425.74, "r_y3": 539.08, "coord_origin": "TOPLEFT" }, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 558.05, "r_x1": 399.74, "r_y1": 558.05, "r_x2": 399.74, "r_y2": 550.03, "r_x3": 328.78, "r_y3": 550.03, "coord_origin": "TOPLEFT" }, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E. Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6" }, { "label": "list_item", "id": 19, "page_no": 8, "cluster": { "id": 19, "label": "list_item", "bbox": { "l": 308.86, "t": 561.48, "r": 545.11, "b": 624.29, "coord_origin": "TOPLEFT" }, "confidence": 0.903, "cells": [ { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 569.5, "r_x1": 324.5, "r_y1": 569.5, "r_x2": 324.5, "r_y2": 561.48, "r_x3": 308.86, "r_y3": 561.48, "coord_origin": "TOPLEFT" }, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.85, "r_y0": 569.5, "r_x1": 545.11, "r_y1": 569.5, "r_x2": 545.11, "r_y2": 561.48, "r_x3": 326.85, "r_y3": 561.48, "coord_origin": "TOPLEFT" }, "text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 580.46, "r_x1": 545.11, "r_y1": 580.46, "r_x2": 545.11, "r_y2": 572.44, "r_x3": 328.78, "r_y3": 572.44, "coord_origin": "TOPLEFT" }, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 591.41, "r_x1": 545.11, "r_y1": 591.41, "r_x2": 545.11, "r_y2": 583.4, "r_x3": 328.78, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 602.37, "r_x1": 431.62, "r_y1": 602.37, "r_x2": 431.62, "r_y2": 594.36, "r_x3": 328.78, "r_y3": 594.36, "coord_origin": "TOPLEFT" }, "text": "image-based documents. In", "orig": "image-based documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.69, "r_y0": 602.17, "r_x1": 545.11, "r_y1": 602.17, "r_x2": 545.11, "r_y2": 594.44, "r_x3": 434.69, "r_y3": 594.44, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 613.13, "r_x1": 545.11, "r_y1": 613.13, "r_x2": 545.11, "r_y2": 605.4, "r_x3": 328.78, "r_y3": 605.4, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition", "orig": "Conference on Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 624.08, "r_x1": 367.8, "r_y1": 624.08, "r_x2": 367.8, "r_y2": 616.36, "r_x3": 328.78, "r_y3": 616.36, "coord_origin": "TOPLEFT" }, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.8, "r_y0": 624.29, "r_x1": 458.69, "r_y1": 624.29, "r_x2": 458.69, "r_y2": 616.28, "r_x3": 367.8, "r_y3": 616.28, "coord_origin": "TOPLEFT" }, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1" }, { "label": "list_item", "id": 23, "page_no": 8, "cluster": { "id": 23, "label": "list_item", "bbox": { "l": 308.86, "t": 627.72, "r": 545.12, "b": 668.61, "coord_origin": "TOPLEFT" }, "confidence": 0.878, "cells": [ { "index": 186, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 635.74, "r_x1": 324.69, "r_y1": 635.74, "r_x2": 324.69, "r_y2": 627.72, "r_x3": 308.86, "r_y3": 627.72, "coord_origin": "TOPLEFT" }, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 187, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.07, "r_y0": 635.74, "r_x1": 545.11, "r_y1": 635.74, "r_x2": 545.11, "r_y2": 627.72, "r_x3": 327.07, "r_y3": 627.72, "coord_origin": "TOPLEFT" }, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 188, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 646.7, "r_x1": 545.11, "r_y1": 646.7, "r_x2": 545.11, "r_y2": 638.68, "r_x3": 328.78, "r_y3": 638.68, "coord_origin": "TOPLEFT" }, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 189, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 657.65, "r_x1": 336.25, "r_y1": 657.65, "r_x2": 336.25, "r_y2": 649.64, "r_x3": 328.78, "r_y3": 649.64, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 190, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.12, "r_y1": 657.45, "r_x2": 545.12, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 191, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 668.41, "r_x1": 406.32, "r_y1": 668.41, "r_x2": 406.32, "r_y2": 660.68, "r_x3": 328.78, "r_y3": 660.68, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 192, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32, "r_y0": 668.61, "r_x1": 521.12, "r_y1": 668.61, "r_x2": 521.12, "r_y2": 660.6, "r_x3": 406.32, "r_y3": 660.6, "coord_origin": "TOPLEFT" }, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3" }, { "label": "list_item", "id": 24, "page_no": 8, "cluster": { "id": 24, "label": "list_item", "bbox": { "l": 308.86, "t": 672.04, "r": 545.11, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.865, "cells": [ { "index": 193, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 680.06, "r_x1": 324.71, "r_y1": 680.06, "r_x2": 324.71, "r_y2": 672.04, "r_x3": 308.86, "r_y3": 672.04, "coord_origin": "TOPLEFT" }, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 194, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.09, "r_y0": 680.06, "r_x1": 545.11, "r_y1": 680.06, "r_x2": 545.11, "r_y2": 672.04, "r_x3": 327.09, "r_y3": 672.04, "coord_origin": "TOPLEFT" }, "text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 195, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 691.02, "r_x1": 482.81, "r_y1": 691.02, "r_x2": 482.81, "r_y2": 683.0, "r_x3": 328.78, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 196, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.75, "r_y0": 691.02, "r_x1": 545.11, "r_y1": 691.02, "r_x2": 545.11, "r_y2": 683.0, "r_x3": 488.75, "r_y3": 683.0, "coord_origin": "TOPLEFT" }, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 197, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 701.98, "r_x1": 545.11, "r_y1": 701.98, "r_x2": 545.11, "r_y2": 693.96, "r_x3": 328.78, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 198, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 712.94, "r_x1": 379.15, "r_y1": 712.94, "r_x2": 379.15, "r_y2": 704.92, "r_x3": 328.78, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "regression. In", "orig": "regression. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 199, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 381.62, "r_y0": 712.73, "r_x1": 545.11, "r_y1": 712.73, "r_x2": 545.11, "r_y2": 705.0, "r_x3": 381.62, "r_y3": 705.0, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on" } ], "headers": [ { "label": "page_footer", "id": 22, "page_no": 8, "cluster": { "id": 22, "label": "page_footer", "bbox": { "l": 295.12, "t": 734.13, "r": 300.1, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.88, "cells": [ { "index": 200, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.12, "r_y0": 743.04, "r_x1": 300.1, "r_y1": 743.04, "r_x2": 300.1, "r_y2": 734.13, "r_x3": 295.12, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" } ] } }, { "page_no": 9, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 83.69, "r_x1": 223.58, "r_y1": 83.69, "r_x2": 223.58, "r_y2": 75.96, "r_x3": 70.03, "r_y3": 75.96, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.58, "r_y0": 83.9, "r_x1": 286.36, "r_y1": 83.9, "r_x2": 286.36, "r_y2": 75.88, "r_x3": 223.58, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": ", pages 658-666,", "orig": ", pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 94.86, "r_x1": 97.92, "r_y1": 94.86, "r_x2": 97.92, "r_y2": 86.84, "r_x3": 70.03, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 106.18, "r_x1": 65.53, "r_y1": 106.18, "r_x2": 65.53, "r_y2": 98.17, "r_x3": 50.11, "r_y3": 98.17, "coord_origin": "TOPLEFT" }, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.85, "r_y0": 106.18, "r_x1": 286.36, "r_y1": 106.18, "r_x2": 286.36, "r_y2": 98.17, "r_x3": 67.85, "r_y3": 98.17, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 117.14, "r_x1": 286.36, "r_y1": 117.14, "r_x2": 286.36, "r_y2": 109.12, "r_x3": 70.03, "r_y3": 109.12, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 128.1, "r_x1": 286.36, "r_y1": 128.1, "r_x2": 286.36, "r_y2": 120.08, "r_x3": 70.03, "r_y3": 120.08, "coord_origin": "TOPLEFT" }, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 139.06, "r_x1": 77.5, "r_y1": 139.06, "r_x2": 77.5, "r_y2": 131.04, "r_x3": 70.03, "r_y3": 131.04, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 80.56, "r_y0": 138.85, "r_x1": 286.37, "r_y1": 138.85, "r_x2": 286.37, "r_y2": 131.12, "r_x3": 80.56, "r_y3": 131.12, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 149.81, "r_x1": 195.23, "r_y1": 149.81, "r_x2": 195.23, "r_y2": 142.08, "r_x3": 70.03, "r_y3": 142.08, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.23, "r_y0": 150.02, "r_x1": 286.37, "r_y1": 150.02, "r_x2": 286.37, "r_y2": 142.0, "r_x3": 195.23, "r_y3": 142.0, "coord_origin": "TOPLEFT" }, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 160.98, "r_x1": 120.33, "r_y1": 160.98, "r_x2": 120.33, "r_y2": 152.96, "r_x3": 70.03, "r_y3": 152.96, "coord_origin": "TOPLEFT" }, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 172.3, "r_x1": 65.53, "r_y1": 172.3, "r_x2": 65.53, "r_y2": 164.28, "r_x3": 50.11, "r_y3": 164.28, "coord_origin": "TOPLEFT" }, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.85, "r_y0": 172.3, "r_x1": 286.36, "r_y1": 172.3, "r_x2": 286.36, "r_y2": 164.28, "r_x3": 67.85, "r_y3": 164.28, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 183.26, "r_x1": 286.36, "r_y1": 183.26, "r_x2": 286.36, "r_y2": 175.24, "r_x3": 70.03, "r_y3": 175.24, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 194.22, "r_x1": 286.36, "r_y1": 194.22, "r_x2": 286.36, "r_y2": 186.2, "r_x3": 70.03, "r_y3": 186.2, "coord_origin": "TOPLEFT" }, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 205.18, "r_x1": 101.33, "r_y1": 205.18, "r_x2": 101.33, "r_y2": 197.16, "r_x3": 70.03, "r_y3": 197.16, "coord_origin": "TOPLEFT" }, "text": "ages. In", "orig": "ages. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.33, "r_y0": 204.97, "r_x1": 286.36, "r_y1": 204.97, "r_x2": 286.36, "r_y2": 197.24, "r_x3": 104.33, "r_y3": 197.24, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 215.93, "r_x1": 220.49, "r_y1": 215.93, "r_x2": 220.49, "r_y2": 208.2, "r_x3": 70.03, "r_y3": 208.2, "coord_origin": "TOPLEFT" }, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.48, "r_y0": 216.14, "r_x1": 286.36, "r_y1": 216.14, "r_x2": 286.36, "r_y2": 208.12, "r_x3": 220.48, "r_y3": 208.12, "coord_origin": "TOPLEFT" }, "text": ", volume 1, pages", "orig": ", volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 227.09, "r_x1": 166.65, "r_y1": 227.09, "r_x2": 166.65, "r_y2": 219.08, "r_x3": 70.03, "r_y3": 219.08, "coord_origin": "TOPLEFT" }, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 238.42, "r_x1": 65.65, "r_y1": 238.42, "r_x2": 65.65, "r_y2": 230.4, "r_x3": 50.11, "r_y3": 230.4, "coord_origin": "TOPLEFT" }, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.98, "r_y0": 238.42, "r_x1": 286.36, "r_y1": 238.42, "r_x2": 286.36, "r_y2": 230.4, "r_x3": 67.98, "r_y3": 230.4, "coord_origin": "TOPLEFT" }, "text": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 249.38, "r_x1": 147.17, "r_y1": 249.38, "r_x2": 147.17, "r_y2": 241.36, "r_x3": 70.03, "r_y3": 241.36, "coord_origin": "TOPLEFT" }, "text": "neous documents. In", "orig": "neous documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.93, "r_y0": 249.17, "r_x1": 286.37, "r_y1": 249.17, "r_x2": 286.37, "r_y2": 241.44, "r_x3": 149.93, "r_y3": 241.44, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 260.13, "r_x1": 244.69, "r_y1": 260.13, "r_x2": 244.69, "r_y2": 252.4, "r_x3": 70.03, "r_y3": 252.4, "coord_origin": "TOPLEFT" }, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.69, "r_y0": 260.34, "r_x1": 286.36, "r_y1": 260.34, "r_x2": 286.36, "r_y2": 252.32, "r_x3": 244.69, "r_y3": 252.32, "coord_origin": "TOPLEFT" }, "text": ", pages 65-", "orig": ", pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 271.3, "r_x1": 111.37, "r_y1": 271.3, "r_x2": 111.37, "r_y2": 263.28, "r_x3": 70.03, "r_y3": 263.28, "coord_origin": "TOPLEFT" }, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 282.62, "r_x1": 66.02, "r_y1": 282.62, "r_x2": 66.02, "r_y2": 274.6, "r_x3": 50.11, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.41, "r_y0": 282.62, "r_x1": 94.94, "r_y1": 282.62, "r_x2": 94.94, "r_y2": 274.6, "r_x3": 68.41, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 100.87, "r_y0": 282.62, "r_x1": 127.27, "r_y1": 282.62, "r_x2": 127.27, "r_y2": 274.6, "r_x3": 100.87, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.19, "r_y0": 282.62, "r_x1": 165.83, "r_y1": 282.62, "r_x2": 165.83, "r_y2": 274.6, "r_x3": 133.19, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.68, "r_y0": 282.62, "r_x1": 194.09, "r_y1": 282.62, "r_x2": 194.09, "r_y2": 274.6, "r_x3": 172.68, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.02, "r_y0": 282.62, "r_x1": 211.48, "r_y1": 282.62, "r_x2": 211.48, "r_y2": 274.6, "r_x3": 200.02, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.41, "r_y0": 282.62, "r_x1": 239.44, "r_y1": 282.62, "r_x2": 239.44, "r_y2": 274.6, "r_x3": 217.41, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 282.62, "r_x1": 264.22, "r_y1": 282.62, "r_x2": 264.22, "r_y2": 274.6, "r_x3": 246.29, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.15, "r_y0": 282.62, "r_x1": 286.36, "r_y1": 282.62, "r_x2": 286.36, "r_y2": 274.6, "r_x3": 270.15, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 293.58, "r_x1": 286.36, "r_y1": 293.58, "r_x2": 286.36, "r_y2": 285.56, "r_x3": 70.03, "r_y3": 285.56, "coord_origin": "TOPLEFT" }, "text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 304.54, "r_x1": 286.36, "r_y1": 304.54, "r_x2": 286.36, "r_y2": 296.52, "r_x3": 70.03, "r_y3": 296.52, "coord_origin": "TOPLEFT" }, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 315.5, "r_x1": 77.5, "r_y1": 315.5, "r_x2": 77.5, "r_y2": 307.48, "r_x3": 70.03, "r_y3": 307.48, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.35, "r_y0": 315.29, "r_x1": 286.37, "r_y1": 315.29, "r_x2": 286.37, "r_y2": 307.56, "r_x3": 79.35, "r_y3": 307.56, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 326.25, "r_x1": 147.57, "r_y1": 326.25, "r_x2": 147.57, "r_y2": 318.52, "r_x3": 70.03, "r_y3": 318.52, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.57, "r_y0": 326.45, "r_x1": 271.34, "r_y1": 326.45, "r_x2": 271.34, "r_y2": 318.44, "r_x3": 147.57, "r_y3": 318.44, "coord_origin": "TOPLEFT" }, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 337.78, "r_x1": 65.37, "r_y1": 337.78, "r_x2": 65.37, "r_y2": 329.76, "r_x3": 50.11, "r_y3": 329.76, "coord_origin": "TOPLEFT" }, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.66, "r_y0": 337.78, "r_x1": 286.36, "r_y1": 337.78, "r_x2": 286.36, "r_y2": 329.76, "r_x3": 67.66, "r_y3": 329.76, "coord_origin": "TOPLEFT" }, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 348.74, "r_x1": 286.36, "r_y1": 348.74, "r_x2": 286.36, "r_y2": 340.72, "r_x3": 70.03, "r_y3": 340.72, "coord_origin": "TOPLEFT" }, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 359.7, "r_x1": 198.82, "r_y1": 359.7, "r_x2": 198.82, "r_y2": 351.68, "r_x3": 70.03, "r_y3": 351.68, "coord_origin": "TOPLEFT" }, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.06, "r_y0": 359.7, "r_x1": 213.53, "r_y1": 359.7, "r_x2": 213.53, "r_y2": 351.68, "r_x3": 206.06, "r_y3": 351.68, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.02, "r_y0": 359.49, "r_x1": 286.36, "r_y1": 359.49, "r_x2": 286.36, "r_y2": 351.76, "r_x3": 217.02, "r_y3": 351.76, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.03, "r_y3": 362.72, "coord_origin": "TOPLEFT" }, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.08, "r_y0": 370.66, "r_x1": 286.36, "r_y1": 370.66, "r_x2": 286.36, "r_y2": 362.64, "r_x3": 143.08, "r_y3": 362.64, "coord_origin": "TOPLEFT" }, "text": ", KDD \u201918, pages 774-782, New York,", "orig": ", KDD \u201918, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 381.61, "r_x1": 161.16, "r_y1": 381.61, "r_x2": 161.16, "r_y2": 373.6, "r_x3": 70.03, "r_y3": 373.6, "coord_origin": "TOPLEFT" }, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 392.94, "r_x1": 65.14, "r_y1": 392.94, "r_x2": 65.14, "r_y2": 384.92, "r_x3": 50.11, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.4, "r_y0": 392.94, "r_x1": 286.36, "r_y1": 392.94, "r_x2": 286.36, "r_y2": 384.92, "r_x3": 67.4, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 403.9, "r_x1": 286.36, "r_y1": 403.9, "r_x2": 286.36, "r_y2": 395.88, "r_x3": 70.03, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 414.86, "r_x1": 125.47, "r_y1": 414.86, "r_x2": 125.47, "r_y2": 406.84, "r_x3": 70.03, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "lia Polosukhin.", "orig": "lia Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.91, "r_y0": 414.86, "r_x1": 230.83, "r_y1": 414.86, "r_x2": 230.83, "r_y2": 406.84, "r_x3": 133.91, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "Attention is all you need.", "orig": "Attention is all you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.27, "r_y0": 414.86, "r_x1": 286.36, "r_y1": 414.86, "r_x2": 286.36, "r_y2": 406.84, "r_x3": 239.27, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "In I. Guyon,", "orig": "In I. Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 425.82, "r_x1": 78.96, "r_y1": 425.82, "r_x2": 78.96, "r_y2": 417.8, "r_x3": 70.03, "r_y3": 417.8, "coord_origin": "TOPLEFT" }, "text": "U.", "orig": "U.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.25, "r_y0": 425.82, "r_x1": 286.36, "r_y1": 425.82, "r_x2": 286.36, "r_y2": 417.8, "r_x3": 81.25, "r_y3": 417.8, "coord_origin": "TOPLEFT" }, "text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 436.77, "r_x1": 196.76, "r_y1": 436.77, "r_x2": 196.76, "r_y2": 428.76, "r_x3": 70.03, "r_y3": 428.76, "coord_origin": "TOPLEFT" }, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.2, "r_y0": 436.57, "r_x1": 286.36, "r_y1": 436.57, "r_x2": 286.36, "r_y2": 428.84, "r_x3": 200.2, "r_y3": 428.84, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 447.53, "r_x1": 189.19, "r_y1": 447.53, "r_x2": 189.19, "r_y2": 439.8, "r_x3": 70.03, "r_y3": 439.8, "coord_origin": "TOPLEFT" }, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 447.73, "r_x1": 286.36, "r_y1": 447.73, "r_x2": 286.36, "r_y2": 439.72, "r_x3": 189.2, "r_y3": 439.72, "coord_origin": "TOPLEFT" }, "text": ", pages 5998-6008. Curran", "orig": ", pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 458.69, "r_x1": 158.92, "r_y1": 458.69, "r_x2": 158.92, "r_y2": 450.68, "r_x3": 70.03, "r_y3": 450.68, "coord_origin": "TOPLEFT" }, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 470.02, "r_x1": 65.91, "r_y1": 470.02, "r_x2": 65.91, "r_y2": 462.0, "r_x3": 50.11, "r_y3": 462.0, "coord_origin": "TOPLEFT" }, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.28, "r_y0": 470.02, "r_x1": 286.36, "r_y1": 470.02, "r_x2": 286.36, "r_y2": 462.0, "r_x3": 68.28, "r_y3": 462.0, "coord_origin": "TOPLEFT" }, "text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 480.97, "r_x1": 116.28, "r_y1": 480.97, "r_x2": 116.28, "r_y2": 472.96, "r_x3": 70.03, "r_y3": 472.96, "coord_origin": "TOPLEFT" }, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.48, "r_y0": 480.97, "r_x1": 286.36, "r_y1": 480.97, "r_x2": 286.36, "r_y2": 472.96, "r_x3": 122.48, "r_y3": 472.96, "coord_origin": "TOPLEFT" }, "text": "Show and tell: A neural image caption gen-", "orig": "Show and tell: A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 491.93, "r_x1": 103.31, "r_y1": 491.93, "r_x2": 103.31, "r_y2": 483.92, "r_x3": 70.03, "r_y3": 483.92, "coord_origin": "TOPLEFT" }, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 105.52, "r_y0": 491.73, "r_x1": 286.36, "r_y1": 491.73, "r_x2": 286.36, "r_y2": 484.0, "r_x3": 105.52, "r_y3": 484.0, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 502.69, "r_x1": 212.52, "r_y1": 502.69, "r_x2": 212.52, "r_y2": 494.96, "r_x3": 70.03, "r_y3": 494.96, "coord_origin": "TOPLEFT" }, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.51, "r_y0": 502.89, "r_x1": 263.56, "r_y1": 502.89, "r_x2": 263.56, "r_y2": 494.88, "r_x3": 212.51, "r_y3": 494.88, "coord_origin": "TOPLEFT" }, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 514.22, "r_x1": 65.68, "r_y1": 514.22, "r_x2": 65.68, "r_y2": 506.2, "r_x3": 50.11, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.02, "r_y0": 514.22, "r_x1": 247.37, "r_y1": 514.22, "r_x2": 247.37, "r_y2": 506.2, "r_x3": 68.02, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.97, "r_y0": 514.22, "r_x1": 286.36, "r_y1": 514.22, "r_x2": 286.36, "r_y2": 506.2, "r_x3": 253.97, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 525.18, "r_x1": 265.62, "r_y1": 525.18, "r_x2": 265.62, "r_y2": 517.16, "r_x3": 70.03, "r_y3": 517.16, "coord_origin": "TOPLEFT" }, "text": "reconstruct syntactic structures from table images. In", "orig": "reconstruct syntactic structures from table images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 268.43, "r_y0": 524.97, "r_x1": 286.36, "r_y1": 524.97, "r_x2": 286.36, "r_y2": 517.24, "r_x3": 268.43, "r_y3": 517.24, "coord_origin": "TOPLEFT" }, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 535.93, "r_x1": 286.36, "r_y1": 535.93, "r_x2": 286.36, "r_y2": 528.2, "r_x3": 70.03, "r_y3": 528.2, "coord_origin": "TOPLEFT" }, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 546.89, "r_x1": 125.26, "r_y1": 546.89, "r_x2": 125.26, "r_y2": 539.16, "r_x3": 70.03, "r_y3": 539.16, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.25, "r_y0": 547.09, "r_x1": 240.05, "r_y1": 547.09, "r_x2": 240.05, "r_y2": 539.08, "r_x3": 125.25, "r_y3": 539.08, "coord_origin": "TOPLEFT" }, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 558.42, "r_x1": 66.04, "r_y1": 558.42, "r_x2": 66.04, "r_y2": 550.4, "r_x3": 50.11, "r_y3": 550.4, "coord_origin": "TOPLEFT" }, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.43, "r_y0": 558.42, "r_x1": 286.36, "r_y1": 558.42, "r_x2": 286.36, "r_y2": 550.4, "r_x3": 68.43, "r_y3": 550.4, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 569.38, "r_x1": 137.08, "r_y1": 569.38, "r_x2": 137.08, "r_y2": 561.36, "r_x3": 70.03, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99, "r_y0": 569.38, "r_x1": 172.38, "r_y1": 569.38, "r_x2": 172.38, "r_y2": 561.36, "r_x3": 145.99, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.7, "r_y0": 569.38, "r_x1": 286.36, "r_y1": 569.38, "r_x2": 286.36, "r_y2": 561.36, "r_x3": 178.7, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "A table graph reconstruction", "orig": "A table graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 580.33, "r_x1": 221.01, "r_y1": 580.33, "r_x2": 221.01, "r_y2": 572.32, "r_x3": 70.03, "r_y3": 572.32, "coord_origin": "TOPLEFT" }, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.54, "r_y0": 580.13, "r_x1": 286.36, "r_y1": 580.13, "r_x2": 286.36, "r_y2": 572.4, "r_x3": 232.54, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint", "orig": "arXiv preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 591.09, "r_x1": 135.53, "r_y1": 591.09, "r_x2": 135.53, "r_y2": 583.36, "r_x3": 70.03, "r_y3": 583.36, "coord_origin": "TOPLEFT" }, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 135.53, "r_y0": 591.29, "r_x1": 167.9, "r_y1": 591.29, "r_x2": 167.9, "r_y2": 583.28, "r_x3": 135.53, "r_y3": 583.28, "coord_origin": "TOPLEFT" }, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 602.62, "r_x1": 65.24, "r_y1": 602.62, "r_x2": 65.24, "r_y2": 594.6, "r_x3": 50.11, "r_y3": 594.6, "coord_origin": "TOPLEFT" }, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.51, "r_y0": 602.62, "r_x1": 286.36, "r_y1": 602.62, "r_x2": 286.36, "r_y2": 594.6, "r_x3": 67.51, "r_y3": 594.6, "coord_origin": "TOPLEFT" }, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 613.58, "r_x1": 109.11, "r_y1": 613.58, "r_x2": 109.11, "r_y2": 605.56, "r_x3": 70.03, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.23, "r_y0": 613.58, "r_x1": 271.77, "r_y1": 613.58, "r_x2": 271.77, "r_y2": 605.56, "r_x3": 116.23, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.89, "r_y0": 613.58, "r_x1": 286.36, "r_y1": 613.58, "r_x2": 286.36, "r_y2": 605.56, "r_x3": 278.89, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 624.33, "r_x1": 286.36, "r_y1": 624.33, "r_x2": 286.36, "r_y2": 616.6, "r_x3": 70.03, "r_y3": 616.6, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 635.29, "r_x1": 139.1, "r_y1": 635.29, "r_x2": 139.1, "r_y2": 627.56, "r_x3": 70.03, "r_y3": 627.56, "coord_origin": "TOPLEFT" }, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.1, "r_y0": 635.49, "r_x1": 238.96, "r_y1": 635.49, "r_x2": 238.96, "r_y2": 627.48, "r_x3": 139.1, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 646.82, "r_x1": 65.2, "r_y1": 646.82, "r_x2": 65.2, "r_y2": 638.8, "r_x3": 50.11, "r_y3": 638.8, "coord_origin": "TOPLEFT" }, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.47, "r_y0": 646.82, "r_x1": 286.36, "r_y1": 646.82, "r_x2": 286.36, "r_y2": 638.8, "r_x3": 67.47, "r_y3": 638.8, "coord_origin": "TOPLEFT" }, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 657.78, "r_x1": 286.36, "r_y1": 657.78, "r_x2": 286.36, "r_y2": 649.76, "r_x3": 70.03, "r_y3": 649.76, "coord_origin": "TOPLEFT" }, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 668.74, "r_x1": 286.36, "r_y1": 668.74, "r_x2": 286.36, "r_y2": 660.72, "r_x3": 70.03, "r_y3": 660.72, "coord_origin": "TOPLEFT" }, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 679.69, "r_x1": 158.46, "r_y1": 679.69, "r_x2": 158.46, "r_y2": 671.68, "r_x3": 70.03, "r_y3": 671.68, "coord_origin": "TOPLEFT" }, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.53, "r_y0": 679.49, "r_x1": 286.36, "r_y1": 679.49, "r_x2": 286.36, "r_y2": 671.76, "r_x3": 160.53, "r_y3": 671.76, "coord_origin": "TOPLEFT" }, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 690.45, "r_x1": 171.42, "r_y1": 690.45, "r_x2": 171.42, "r_y2": 682.72, "r_x3": 70.03, "r_y3": 682.72, "coord_origin": "TOPLEFT" }, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.42, "r_y0": 690.65, "r_x1": 212.76, "r_y1": 690.65, "r_x2": 212.76, "r_y2": 682.64, "r_x3": 171.42, "r_y3": 682.64, "coord_origin": "TOPLEFT" }, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.98, "r_x1": 66.51, "r_y1": 701.98, "r_x2": 66.51, "r_y2": 693.96, "r_x3": 50.11, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.97, "r_y0": 701.98, "r_x1": 80.99, "r_y1": 701.98, "r_x2": 80.99, "r_y2": 693.96, "r_x3": 68.97, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.06, "r_y0": 701.98, "r_x1": 114.71, "r_y1": 701.98, "r_x2": 114.71, "r_y2": 693.96, "r_x3": 89.06, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.25, "r_y0": 701.98, "r_x1": 149.15, "r_y1": 701.98, "r_x2": 149.15, "r_y2": 693.96, "r_x3": 124.25, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.22, "r_y0": 701.98, "r_x1": 209.37, "r_y1": 701.98, "r_x2": 209.37, "r_y2": 693.96, "r_x3": 157.22, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.9, "r_y0": 701.98, "r_x1": 231.85, "r_y1": 701.98, "r_x2": 231.85, "r_y2": 693.96, "r_x3": 218.9, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.93, "r_y0": 701.98, "r_x1": 269.32, "r_y1": 701.98, "r_x2": 269.32, "r_y2": 693.96, "r_x3": 239.93, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 277.39, "r_y0": 701.98, "r_x1": 286.36, "r_y1": 701.98, "r_x2": 286.36, "r_y2": 693.96, "r_x3": 277.39, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 712.94, "r_x1": 286.36, "r_y1": 712.94, "r_x2": 286.36, "r_y2": 704.92, "r_x3": 70.03, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "meno Yepes. Image-based table recognition: Data, model,", "orig": "meno Yepes. Image-based table recognition: Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 83.9, "r_x1": 545.11, "r_y1": 83.9, "r_x2": 545.11, "r_y2": 75.88, "r_x3": 328.78, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 94.86, "r_x1": 472.31, "r_y1": 94.86, "r_x2": 472.31, "r_y2": 86.84, "r_x3": 328.78, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.89, "r_y0": 94.65, "r_x1": 545.11, "r_y1": 94.65, "r_x2": 545.11, "r_y2": 86.92, "r_x3": 475.89, "r_y3": 86.92, "coord_origin": "TOPLEFT" }, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 105.61, "r_x1": 371.93, "r_y1": 105.61, "r_x2": 371.93, "r_y2": 97.88, "r_x3": 328.78, "r_y3": 97.88, "coord_origin": "TOPLEFT" }, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.93, "r_y0": 105.82, "r_x1": 545.11, "r_y1": 105.82, "r_x2": 545.11, "r_y2": 97.8, "r_x3": 371.93, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": ", pages 564-580, Cham, 2020. Springer Interna-", "orig": ", pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 116.78, "r_x1": 417.7, "r_y1": 116.78, "r_x2": 417.7, "r_y2": 108.76, "r_x3": 328.78, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 128.73, "r_x1": 324.33, "r_y1": 128.73, "r_x2": 324.33, "r_y2": 120.71, "r_x3": 308.86, "r_y3": 120.71, "coord_origin": "TOPLEFT" }, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.65, "r_y0": 128.73, "r_x1": 545.11, "r_y1": 128.73, "r_x2": 545.11, "r_y2": 120.71, "r_x3": 326.65, "r_y3": 120.71, "coord_origin": "TOPLEFT" }, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 139.69, "r_x1": 545.11, "r_y1": 139.69, "r_x2": 545.11, "r_y2": 131.67, "r_x3": 328.78, "r_y3": 131.67, "coord_origin": "TOPLEFT" }, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 150.44, "r_x1": 545.11, "r_y1": 150.44, "r_x2": 545.11, "r_y2": 142.71, "r_x3": 328.78, "r_y3": 142.71, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 161.4, "r_x1": 406.32, "r_y1": 161.4, "r_x2": 406.32, "r_y2": 153.67, "r_x3": 328.78, "r_y3": 153.67, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32, "r_y0": 161.61, "r_x1": 506.18, "r_y1": 161.61, "r_x2": 506.18, "r_y2": 153.59, "r_x3": 406.32, "r_y3": 153.59, "coord_origin": "TOPLEFT" }, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 15, "label": "text", "bbox": { "l": 70.03, "t": 75.88, "r": 286.36, "b": 94.86, "coord_origin": "TOPLEFT" }, "confidence": 0.689, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 83.69, "r_x1": 223.58, "r_y1": 83.69, "r_x2": 223.58, "r_y2": 75.96, "r_x3": 70.03, "r_y3": 75.96, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.58, "r_y0": 83.9, "r_x1": 286.36, "r_y1": 83.9, "r_x2": 286.36, "r_y2": 75.88, "r_x3": 223.58, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": ", pages 658-666,", "orig": ", pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 94.86, "r_x1": 97.92, "r_y1": 94.86, "r_x2": 97.92, "r_y2": 86.84, "r_x3": 70.03, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 98.17, "r": 286.37, "b": 160.98, "coord_origin": "TOPLEFT" }, "confidence": 0.772, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 106.18, "r_x1": 65.53, "r_y1": 106.18, "r_x2": 65.53, "r_y2": 98.17, "r_x3": 50.11, "r_y3": 98.17, "coord_origin": "TOPLEFT" }, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.85, "r_y0": 106.18, "r_x1": 286.36, "r_y1": 106.18, "r_x2": 286.36, "r_y2": 98.17, "r_x3": 67.85, "r_y3": 98.17, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 117.14, "r_x1": 286.36, "r_y1": 117.14, "r_x2": 286.36, "r_y2": 109.12, "r_x3": 70.03, "r_y3": 109.12, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 128.1, "r_x1": 286.36, "r_y1": 128.1, "r_x2": 286.36, "r_y2": 120.08, "r_x3": 70.03, "r_y3": 120.08, "coord_origin": "TOPLEFT" }, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 139.06, "r_x1": 77.5, "r_y1": 139.06, "r_x2": 77.5, "r_y2": 131.04, "r_x3": 70.03, "r_y3": 131.04, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 80.56, "r_y0": 138.85, "r_x1": 286.37, "r_y1": 138.85, "r_x2": 286.37, "r_y2": 131.12, "r_x3": 80.56, "r_y3": 131.12, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 149.81, "r_x1": 195.23, "r_y1": 149.81, "r_x2": 195.23, "r_y2": 142.08, "r_x3": 70.03, "r_y3": 142.08, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.23, "r_y0": 150.02, "r_x1": 286.37, "r_y1": 150.02, "r_x2": 286.37, "r_y2": 142.0, "r_x3": 195.23, "r_y3": 142.0, "coord_origin": "TOPLEFT" }, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 160.98, "r_x1": 120.33, "r_y1": 160.98, "r_x2": 120.33, "r_y2": 152.96, "r_x3": 70.03, "r_y3": 152.96, "coord_origin": "TOPLEFT" }, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 50.11, "t": 164.28, "r": 286.36, "b": 227.09, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 172.3, "r_x1": 65.53, "r_y1": 172.3, "r_x2": 65.53, "r_y2": 164.28, "r_x3": 50.11, "r_y3": 164.28, "coord_origin": "TOPLEFT" }, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.85, "r_y0": 172.3, "r_x1": 286.36, "r_y1": 172.3, "r_x2": 286.36, "r_y2": 164.28, "r_x3": 67.85, "r_y3": 164.28, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 183.26, "r_x1": 286.36, "r_y1": 183.26, "r_x2": 286.36, "r_y2": 175.24, "r_x3": 70.03, "r_y3": 175.24, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 194.22, "r_x1": 286.36, "r_y1": 194.22, "r_x2": 286.36, "r_y2": 186.2, "r_x3": 70.03, "r_y3": 186.2, "coord_origin": "TOPLEFT" }, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 205.18, "r_x1": 101.33, "r_y1": 205.18, "r_x2": 101.33, "r_y2": 197.16, "r_x3": 70.03, "r_y3": 197.16, "coord_origin": "TOPLEFT" }, "text": "ages. In", "orig": "ages. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.33, "r_y0": 204.97, "r_x1": 286.36, "r_y1": 204.97, "r_x2": 286.36, "r_y2": 197.24, "r_x3": 104.33, "r_y3": 197.24, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 215.93, "r_x1": 220.49, "r_y1": 215.93, "r_x2": 220.49, "r_y2": 208.2, "r_x3": 70.03, "r_y3": 208.2, "coord_origin": "TOPLEFT" }, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.48, "r_y0": 216.14, "r_x1": 286.36, "r_y1": 216.14, "r_x2": 286.36, "r_y2": 208.12, "r_x3": 220.48, "r_y3": 208.12, "coord_origin": "TOPLEFT" }, "text": ", volume 1, pages", "orig": ", volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 227.09, "r_x1": 166.65, "r_y1": 227.09, "r_x2": 166.65, "r_y2": 219.08, "r_x3": 70.03, "r_y3": 219.08, "coord_origin": "TOPLEFT" }, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 50.11, "t": 230.4, "r": 286.37, "b": 271.3, "coord_origin": "TOPLEFT" }, "confidence": 0.851, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 238.42, "r_x1": 65.65, "r_y1": 238.42, "r_x2": 65.65, "r_y2": 230.4, "r_x3": 50.11, "r_y3": 230.4, "coord_origin": "TOPLEFT" }, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.98, "r_y0": 238.42, "r_x1": 286.36, "r_y1": 238.42, "r_x2": 286.36, "r_y2": 230.4, "r_x3": 67.98, "r_y3": 230.4, "coord_origin": "TOPLEFT" }, "text": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 249.38, "r_x1": 147.17, "r_y1": 249.38, "r_x2": 147.17, "r_y2": 241.36, "r_x3": 70.03, "r_y3": 241.36, "coord_origin": "TOPLEFT" }, "text": "neous documents. In", "orig": "neous documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.93, "r_y0": 249.17, "r_x1": 286.37, "r_y1": 249.17, "r_x2": 286.37, "r_y2": 241.44, "r_x3": 149.93, "r_y3": 241.44, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 260.13, "r_x1": 244.69, "r_y1": 260.13, "r_x2": 244.69, "r_y2": 252.4, "r_x3": 70.03, "r_y3": 252.4, "coord_origin": "TOPLEFT" }, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.69, "r_y0": 260.34, "r_x1": 286.36, "r_y1": 260.34, "r_x2": 286.36, "r_y2": 252.32, "r_x3": 244.69, "r_y3": 252.32, "coord_origin": "TOPLEFT" }, "text": ", pages 65-", "orig": ", pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 271.3, "r_x1": 111.37, "r_y1": 271.3, "r_x2": 111.37, "r_y2": 263.28, "r_x3": 70.03, "r_y3": 263.28, "coord_origin": "TOPLEFT" }, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 274.6, "r": 286.37, "b": 326.45, "coord_origin": "TOPLEFT" }, "confidence": 0.849, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 282.62, "r_x1": 66.02, "r_y1": 282.62, "r_x2": 66.02, "r_y2": 274.6, "r_x3": 50.11, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.41, "r_y0": 282.62, "r_x1": 94.94, "r_y1": 282.62, "r_x2": 94.94, "r_y2": 274.6, "r_x3": 68.41, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 100.87, "r_y0": 282.62, "r_x1": 127.27, "r_y1": 282.62, "r_x2": 127.27, "r_y2": 274.6, "r_x3": 100.87, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.19, "r_y0": 282.62, "r_x1": 165.83, "r_y1": 282.62, "r_x2": 165.83, "r_y2": 274.6, "r_x3": 133.19, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.68, "r_y0": 282.62, "r_x1": 194.09, "r_y1": 282.62, "r_x2": 194.09, "r_y2": 274.6, "r_x3": 172.68, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.02, "r_y0": 282.62, "r_x1": 211.48, "r_y1": 282.62, "r_x2": 211.48, "r_y2": 274.6, "r_x3": 200.02, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.41, "r_y0": 282.62, "r_x1": 239.44, "r_y1": 282.62, "r_x2": 239.44, "r_y2": 274.6, "r_x3": 217.41, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 282.62, "r_x1": 264.22, "r_y1": 282.62, "r_x2": 264.22, "r_y2": 274.6, "r_x3": 246.29, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.15, "r_y0": 282.62, "r_x1": 286.36, "r_y1": 282.62, "r_x2": 286.36, "r_y2": 274.6, "r_x3": 270.15, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 293.58, "r_x1": 286.36, "r_y1": 293.58, "r_x2": 286.36, "r_y2": 285.56, "r_x3": 70.03, "r_y3": 285.56, "coord_origin": "TOPLEFT" }, "text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 304.54, "r_x1": 286.36, "r_y1": 304.54, "r_x2": 286.36, "r_y2": 296.52, "r_x3": 70.03, "r_y3": 296.52, "coord_origin": "TOPLEFT" }, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 315.5, "r_x1": 77.5, "r_y1": 315.5, "r_x2": 77.5, "r_y2": 307.48, "r_x3": 70.03, "r_y3": 307.48, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.35, "r_y0": 315.29, "r_x1": 286.37, "r_y1": 315.29, "r_x2": 286.37, "r_y2": 307.56, "r_x3": 79.35, "r_y3": 307.56, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 326.25, "r_x1": 147.57, "r_y1": 326.25, "r_x2": 147.57, "r_y2": 318.52, "r_x3": 70.03, "r_y3": 318.52, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.57, "r_y0": 326.45, "r_x1": 271.34, "r_y1": 326.45, "r_x2": 271.34, "r_y2": 318.44, "r_x3": 147.57, "r_y3": 318.44, "coord_origin": "TOPLEFT" }, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 50.11, "t": 329.76, "r": 286.36, "b": 381.61, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 337.78, "r_x1": 65.37, "r_y1": 337.78, "r_x2": 65.37, "r_y2": 329.76, "r_x3": 50.11, "r_y3": 329.76, "coord_origin": "TOPLEFT" }, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.66, "r_y0": 337.78, "r_x1": 286.36, "r_y1": 337.78, "r_x2": 286.36, "r_y2": 329.76, "r_x3": 67.66, "r_y3": 329.76, "coord_origin": "TOPLEFT" }, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 348.74, "r_x1": 286.36, "r_y1": 348.74, "r_x2": 286.36, "r_y2": 340.72, "r_x3": 70.03, "r_y3": 340.72, "coord_origin": "TOPLEFT" }, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 359.7, "r_x1": 198.82, "r_y1": 359.7, "r_x2": 198.82, "r_y2": 351.68, "r_x3": 70.03, "r_y3": 351.68, "coord_origin": "TOPLEFT" }, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.06, "r_y0": 359.7, "r_x1": 213.53, "r_y1": 359.7, "r_x2": 213.53, "r_y2": 351.68, "r_x3": 206.06, "r_y3": 351.68, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.02, "r_y0": 359.49, "r_x1": 286.36, "r_y1": 359.49, "r_x2": 286.36, "r_y2": 351.76, "r_x3": 217.02, "r_y3": 351.76, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.03, "r_y3": 362.72, "coord_origin": "TOPLEFT" }, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.08, "r_y0": 370.66, "r_x1": 286.36, "r_y1": 370.66, "r_x2": 286.36, "r_y2": 362.64, "r_x3": 143.08, "r_y3": 362.64, "coord_origin": "TOPLEFT" }, "text": ", KDD \u201918, pages 774-782, New York,", "orig": ", KDD \u201918, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 381.61, "r_x1": 161.16, "r_y1": 381.61, "r_x2": 161.16, "r_y2": 373.6, "r_x3": 70.03, "r_y3": 373.6, "coord_origin": "TOPLEFT" }, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 50.11, "t": 384.92, "r": 286.36, "b": 458.69, "coord_origin": "TOPLEFT" }, "confidence": 0.883, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 392.94, "r_x1": 65.14, "r_y1": 392.94, "r_x2": 65.14, "r_y2": 384.92, "r_x3": 50.11, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.4, "r_y0": 392.94, "r_x1": 286.36, "r_y1": 392.94, "r_x2": 286.36, "r_y2": 384.92, "r_x3": 67.4, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 403.9, "r_x1": 286.36, "r_y1": 403.9, "r_x2": 286.36, "r_y2": 395.88, "r_x3": 70.03, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 414.86, "r_x1": 125.47, "r_y1": 414.86, "r_x2": 125.47, "r_y2": 406.84, "r_x3": 70.03, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "lia Polosukhin.", "orig": "lia Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.91, "r_y0": 414.86, "r_x1": 230.83, "r_y1": 414.86, "r_x2": 230.83, "r_y2": 406.84, "r_x3": 133.91, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "Attention is all you need.", "orig": "Attention is all you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.27, "r_y0": 414.86, "r_x1": 286.36, "r_y1": 414.86, "r_x2": 286.36, "r_y2": 406.84, "r_x3": 239.27, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "In I. Guyon,", "orig": "In I. Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 425.82, "r_x1": 78.96, "r_y1": 425.82, "r_x2": 78.96, "r_y2": 417.8, "r_x3": 70.03, "r_y3": 417.8, "coord_origin": "TOPLEFT" }, "text": "U.", "orig": "U.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.25, "r_y0": 425.82, "r_x1": 286.36, "r_y1": 425.82, "r_x2": 286.36, "r_y2": 417.8, "r_x3": 81.25, "r_y3": 417.8, "coord_origin": "TOPLEFT" }, "text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 436.77, "r_x1": 196.76, "r_y1": 436.77, "r_x2": 196.76, "r_y2": 428.76, "r_x3": 70.03, "r_y3": 428.76, "coord_origin": "TOPLEFT" }, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.2, "r_y0": 436.57, "r_x1": 286.36, "r_y1": 436.57, "r_x2": 286.36, "r_y2": 428.84, "r_x3": 200.2, "r_y3": 428.84, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 447.53, "r_x1": 189.19, "r_y1": 447.53, "r_x2": 189.19, "r_y2": 439.8, "r_x3": 70.03, "r_y3": 439.8, "coord_origin": "TOPLEFT" }, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 447.73, "r_x1": 286.36, "r_y1": 447.73, "r_x2": 286.36, "r_y2": 439.72, "r_x3": 189.2, "r_y3": 439.72, "coord_origin": "TOPLEFT" }, "text": ", pages 5998-6008. Curran", "orig": ", pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 458.69, "r_x1": 158.92, "r_y1": 458.69, "r_x2": 158.92, "r_y2": 450.68, "r_x3": 70.03, "r_y3": 450.68, "coord_origin": "TOPLEFT" }, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 50.11, "t": 462.0, "r": 286.36, "b": 502.89, "coord_origin": "TOPLEFT" }, "confidence": 0.843, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 470.02, "r_x1": 65.91, "r_y1": 470.02, "r_x2": 65.91, "r_y2": 462.0, "r_x3": 50.11, "r_y3": 462.0, "coord_origin": "TOPLEFT" }, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.28, "r_y0": 470.02, "r_x1": 286.36, "r_y1": 470.02, "r_x2": 286.36, "r_y2": 462.0, "r_x3": 68.28, "r_y3": 462.0, "coord_origin": "TOPLEFT" }, "text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 480.97, "r_x1": 116.28, "r_y1": 480.97, "r_x2": 116.28, "r_y2": 472.96, "r_x3": 70.03, "r_y3": 472.96, "coord_origin": "TOPLEFT" }, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.48, "r_y0": 480.97, "r_x1": 286.36, "r_y1": 480.97, "r_x2": 286.36, "r_y2": 472.96, "r_x3": 122.48, "r_y3": 472.96, "coord_origin": "TOPLEFT" }, "text": "Show and tell: A neural image caption gen-", "orig": "Show and tell: A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 491.93, "r_x1": 103.31, "r_y1": 491.93, "r_x2": 103.31, "r_y2": 483.92, "r_x3": 70.03, "r_y3": 483.92, "coord_origin": "TOPLEFT" }, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 105.52, "r_y0": 491.73, "r_x1": 286.36, "r_y1": 491.73, "r_x2": 286.36, "r_y2": 484.0, "r_x3": 105.52, "r_y3": 484.0, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 502.69, "r_x1": 212.52, "r_y1": 502.69, "r_x2": 212.52, "r_y2": 494.96, "r_x3": 70.03, "r_y3": 494.96, "coord_origin": "TOPLEFT" }, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.51, "r_y0": 502.89, "r_x1": 263.56, "r_y1": 502.89, "r_x2": 263.56, "r_y2": 494.88, "r_x3": 212.51, "r_y3": 494.88, "coord_origin": "TOPLEFT" }, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 50.11, "t": 506.2, "r": 286.36, "b": 547.09, "coord_origin": "TOPLEFT" }, "confidence": 0.841, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 514.22, "r_x1": 65.68, "r_y1": 514.22, "r_x2": 65.68, "r_y2": 506.2, "r_x3": 50.11, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.02, "r_y0": 514.22, "r_x1": 247.37, "r_y1": 514.22, "r_x2": 247.37, "r_y2": 506.2, "r_x3": 68.02, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.97, "r_y0": 514.22, "r_x1": 286.36, "r_y1": 514.22, "r_x2": 286.36, "r_y2": 506.2, "r_x3": 253.97, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 525.18, "r_x1": 265.62, "r_y1": 525.18, "r_x2": 265.62, "r_y2": 517.16, "r_x3": 70.03, "r_y3": 517.16, "coord_origin": "TOPLEFT" }, "text": "reconstruct syntactic structures from table images. In", "orig": "reconstruct syntactic structures from table images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 268.43, "r_y0": 524.97, "r_x1": 286.36, "r_y1": 524.97, "r_x2": 286.36, "r_y2": 517.24, "r_x3": 268.43, "r_y3": 517.24, "coord_origin": "TOPLEFT" }, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 535.93, "r_x1": 286.36, "r_y1": 535.93, "r_x2": 286.36, "r_y2": 528.2, "r_x3": 70.03, "r_y3": 528.2, "coord_origin": "TOPLEFT" }, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 546.89, "r_x1": 125.26, "r_y1": 546.89, "r_x2": 125.26, "r_y2": 539.16, "r_x3": 70.03, "r_y3": 539.16, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.25, "r_y0": 547.09, "r_x1": 240.05, "r_y1": 547.09, "r_x2": 240.05, "r_y2": 539.08, "r_x3": 125.25, "r_y3": 539.08, "coord_origin": "TOPLEFT" }, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "list_item", "bbox": { "l": 50.11, "t": 550.4, "r": 286.36, "b": 591.29, "coord_origin": "TOPLEFT" }, "confidence": 0.824, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 558.42, "r_x1": 66.04, "r_y1": 558.42, "r_x2": 66.04, "r_y2": 550.4, "r_x3": 50.11, "r_y3": 550.4, "coord_origin": "TOPLEFT" }, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.43, "r_y0": 558.42, "r_x1": 286.36, "r_y1": 558.42, "r_x2": 286.36, "r_y2": 550.4, "r_x3": 68.43, "r_y3": 550.4, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 569.38, "r_x1": 137.08, "r_y1": 569.38, "r_x2": 137.08, "r_y2": 561.36, "r_x3": 70.03, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99, "r_y0": 569.38, "r_x1": 172.38, "r_y1": 569.38, "r_x2": 172.38, "r_y2": 561.36, "r_x3": 145.99, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.7, "r_y0": 569.38, "r_x1": 286.36, "r_y1": 569.38, "r_x2": 286.36, "r_y2": 561.36, "r_x3": 178.7, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "A table graph reconstruction", "orig": "A table graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 580.33, "r_x1": 221.01, "r_y1": 580.33, "r_x2": 221.01, "r_y2": 572.32, "r_x3": 70.03, "r_y3": 572.32, "coord_origin": "TOPLEFT" }, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.54, "r_y0": 580.13, "r_x1": 286.36, "r_y1": 580.13, "r_x2": 286.36, "r_y2": 572.4, "r_x3": 232.54, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint", "orig": "arXiv preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 591.09, "r_x1": 135.53, "r_y1": 591.09, "r_x2": 135.53, "r_y2": 583.36, "r_x3": 70.03, "r_y3": 583.36, "coord_origin": "TOPLEFT" }, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 135.53, "r_y0": 591.29, "r_x1": 167.9, "r_y1": 591.29, "r_x2": 167.9, "r_y2": 583.28, "r_x3": 135.53, "r_y3": 583.28, "coord_origin": "TOPLEFT" }, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 50.11, "t": 594.6, "r": 286.36, "b": 635.49, "coord_origin": "TOPLEFT" }, "confidence": 0.836, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 602.62, "r_x1": 65.24, "r_y1": 602.62, "r_x2": 65.24, "r_y2": 594.6, "r_x3": 50.11, "r_y3": 594.6, "coord_origin": "TOPLEFT" }, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.51, "r_y0": 602.62, "r_x1": 286.36, "r_y1": 602.62, "r_x2": 286.36, "r_y2": 594.6, "r_x3": 67.51, "r_y3": 594.6, "coord_origin": "TOPLEFT" }, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 613.58, "r_x1": 109.11, "r_y1": 613.58, "r_x2": 109.11, "r_y2": 605.56, "r_x3": 70.03, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.23, "r_y0": 613.58, "r_x1": 271.77, "r_y1": 613.58, "r_x2": 271.77, "r_y2": 605.56, "r_x3": 116.23, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.89, "r_y0": 613.58, "r_x1": 286.36, "r_y1": 613.58, "r_x2": 286.36, "r_y2": 605.56, "r_x3": 278.89, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 624.33, "r_x1": 286.36, "r_y1": 624.33, "r_x2": 286.36, "r_y2": 616.6, "r_x3": 70.03, "r_y3": 616.6, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 635.29, "r_x1": 139.1, "r_y1": 635.29, "r_x2": 139.1, "r_y2": 627.56, "r_x3": 70.03, "r_y3": 627.56, "coord_origin": "TOPLEFT" }, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.1, "r_y0": 635.49, "r_x1": 238.96, "r_y1": 635.49, "r_x2": 238.96, "r_y2": 627.48, "r_x3": 139.1, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 50.11, "t": 638.8, "r": 286.36, "b": 690.65, "coord_origin": "TOPLEFT" }, "confidence": 0.808, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 646.82, "r_x1": 65.2, "r_y1": 646.82, "r_x2": 65.2, "r_y2": 638.8, "r_x3": 50.11, "r_y3": 638.8, "coord_origin": "TOPLEFT" }, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.47, "r_y0": 646.82, "r_x1": 286.36, "r_y1": 646.82, "r_x2": 286.36, "r_y2": 638.8, "r_x3": 67.47, "r_y3": 638.8, "coord_origin": "TOPLEFT" }, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 657.78, "r_x1": 286.36, "r_y1": 657.78, "r_x2": 286.36, "r_y2": 649.76, "r_x3": 70.03, "r_y3": 649.76, "coord_origin": "TOPLEFT" }, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 668.74, "r_x1": 286.36, "r_y1": 668.74, "r_x2": 286.36, "r_y2": 660.72, "r_x3": 70.03, "r_y3": 660.72, "coord_origin": "TOPLEFT" }, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 679.69, "r_x1": 158.46, "r_y1": 679.69, "r_x2": 158.46, "r_y2": 671.68, "r_x3": 70.03, "r_y3": 671.68, "coord_origin": "TOPLEFT" }, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.53, "r_y0": 679.49, "r_x1": 286.36, "r_y1": 679.49, "r_x2": 286.36, "r_y2": 671.76, "r_x3": 160.53, "r_y3": 671.76, "coord_origin": "TOPLEFT" }, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 690.45, "r_x1": 171.42, "r_y1": 690.45, "r_x2": 171.42, "r_y2": 682.72, "r_x3": 70.03, "r_y3": 682.72, "coord_origin": "TOPLEFT" }, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.42, "r_y0": 690.65, "r_x1": 212.76, "r_y1": 690.65, "r_x2": 212.76, "r_y2": 682.64, "r_x3": 171.42, "r_y3": 682.64, "coord_origin": "TOPLEFT" }, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 50.11, "t": 693.96, "r": 286.36, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.839, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.98, "r_x1": 66.51, "r_y1": 701.98, "r_x2": 66.51, "r_y2": 693.96, "r_x3": 50.11, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.97, "r_y0": 701.98, "r_x1": 80.99, "r_y1": 701.98, "r_x2": 80.99, "r_y2": 693.96, "r_x3": 68.97, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.06, "r_y0": 701.98, "r_x1": 114.71, "r_y1": 701.98, "r_x2": 114.71, "r_y2": 693.96, "r_x3": 89.06, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.25, "r_y0": 701.98, "r_x1": 149.15, "r_y1": 701.98, "r_x2": 149.15, "r_y2": 693.96, "r_x3": 124.25, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.22, "r_y0": 701.98, "r_x1": 209.37, "r_y1": 701.98, "r_x2": 209.37, "r_y2": 693.96, "r_x3": 157.22, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.9, "r_y0": 701.98, "r_x1": 231.85, "r_y1": 701.98, "r_x2": 231.85, "r_y2": 693.96, "r_x3": 218.9, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.93, "r_y0": 701.98, "r_x1": 269.32, "r_y1": 701.98, "r_x2": 269.32, "r_y2": 693.96, "r_x3": 239.93, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 277.39, "r_y0": 701.98, "r_x1": 286.36, "r_y1": 701.98, "r_x2": 286.36, "r_y2": 693.96, "r_x3": 277.39, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 712.94, "r_x1": 286.36, "r_y1": 712.94, "r_x2": 286.36, "r_y2": 704.92, "r_x3": 70.03, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "meno Yepes. Image-based table recognition: Data, model,", "orig": "meno Yepes. Image-based table recognition: Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "list_item", "bbox": { "l": 328.78, "t": 75.88, "r": 545.11, "b": 116.78, "coord_origin": "TOPLEFT" }, "confidence": 0.756, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 83.9, "r_x1": 545.11, "r_y1": 83.9, "r_x2": 545.11, "r_y2": 75.88, "r_x3": 328.78, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 94.86, "r_x1": 472.31, "r_y1": 94.86, "r_x2": 472.31, "r_y2": 86.84, "r_x3": 328.78, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.89, "r_y0": 94.65, "r_x1": 545.11, "r_y1": 94.65, "r_x2": 545.11, "r_y2": 86.92, "r_x3": 475.89, "r_y3": 86.92, "coord_origin": "TOPLEFT" }, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 105.61, "r_x1": 371.93, "r_y1": 105.61, "r_x2": 371.93, "r_y2": 97.88, "r_x3": 328.78, "r_y3": 97.88, "coord_origin": "TOPLEFT" }, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.93, "r_y0": 105.82, "r_x1": 545.11, "r_y1": 105.82, "r_x2": 545.11, "r_y2": 97.8, "r_x3": 371.93, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": ", pages 564-580, Cham, 2020. Springer Interna-", "orig": ", pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 116.78, "r_x1": 417.7, "r_y1": 116.78, "r_x2": 417.7, "r_y2": 108.76, "r_x3": 328.78, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 120.71, "r": 545.11, "b": 161.61, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 128.73, "r_x1": 324.33, "r_y1": 128.73, "r_x2": 324.33, "r_y2": 120.71, "r_x3": 308.86, "r_y3": 120.71, "coord_origin": "TOPLEFT" }, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.65, "r_y0": 128.73, "r_x1": 545.11, "r_y1": 128.73, "r_x2": 545.11, "r_y2": 120.71, "r_x3": 326.65, "r_y3": 120.71, "coord_origin": "TOPLEFT" }, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 139.69, "r_x1": 545.11, "r_y1": 139.69, "r_x2": 545.11, "r_y2": 131.67, "r_x3": 328.78, "r_y3": 131.67, "coord_origin": "TOPLEFT" }, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 150.44, "r_x1": 545.11, "r_y1": 150.44, "r_x2": 545.11, "r_y2": 142.71, "r_x3": 328.78, "r_y3": 142.71, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 161.4, "r_x1": 406.32, "r_y1": 161.4, "r_x2": 406.32, "r_y2": 153.67, "r_x3": 328.78, "r_y3": 153.67, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32, "r_y0": 161.61, "r_x1": 506.18, "r_y1": 161.61, "r_x2": 506.18, "r_y2": 153.59, "r_x3": 406.32, "r_y3": 153.59, "coord_origin": "TOPLEFT" }, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.907, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 15, "page_no": 9, "cluster": { "id": 15, "label": "text", "bbox": { "l": 70.03, "t": 75.88, "r": 286.36, "b": 94.86, "coord_origin": "TOPLEFT" }, "confidence": 0.689, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 83.69, "r_x1": 223.58, "r_y1": 83.69, "r_x2": 223.58, "r_y2": 75.96, "r_x3": 70.03, "r_y3": 75.96, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.58, "r_y0": 83.9, "r_x1": 286.36, "r_y1": 83.9, "r_x2": 286.36, "r_y2": 75.88, "r_x3": 223.58, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": ", pages 658-666,", "orig": ", pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 94.86, "r_x1": 97.92, "r_y1": 94.86, "r_x2": 97.92, "r_y2": 86.84, "r_x3": 70.03, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6" }, { "label": "list_item", "id": 13, "page_no": 9, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 98.17, "r": 286.37, "b": 160.98, "coord_origin": "TOPLEFT" }, "confidence": 0.772, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 106.18, "r_x1": 65.53, "r_y1": 106.18, "r_x2": 65.53, "r_y2": 98.17, "r_x3": 50.11, "r_y3": 98.17, "coord_origin": "TOPLEFT" }, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.85, "r_y0": 106.18, "r_x1": 286.36, "r_y1": 106.18, "r_x2": 286.36, "r_y2": 98.17, "r_x3": 67.85, "r_y3": 98.17, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 117.14, "r_x1": 286.36, "r_y1": 117.14, "r_x2": 286.36, "r_y2": 109.12, "r_x3": 70.03, "r_y3": 109.12, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 128.1, "r_x1": 286.36, "r_y1": 128.1, "r_x2": 286.36, "r_y2": 120.08, "r_x3": 70.03, "r_y3": 120.08, "coord_origin": "TOPLEFT" }, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 139.06, "r_x1": 77.5, "r_y1": 139.06, "r_x2": 77.5, "r_y2": 131.04, "r_x3": 70.03, "r_y3": 131.04, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 80.56, "r_y0": 138.85, "r_x1": 286.37, "r_y1": 138.85, "r_x2": 286.37, "r_y2": 131.12, "r_x3": 80.56, "r_y3": 131.12, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 149.81, "r_x1": 195.23, "r_y1": 149.81, "r_x2": 195.23, "r_y2": 142.08, "r_x3": 70.03, "r_y3": 142.08, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.23, "r_y0": 150.02, "r_x1": 286.37, "r_y1": 150.02, "r_x2": 286.37, "r_y2": 142.0, "r_x3": 195.23, "r_y3": 142.0, "coord_origin": "TOPLEFT" }, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 160.98, "r_x1": 120.33, "r_y1": 160.98, "r_x2": 120.33, "r_y2": 152.96, "r_x3": 70.03, "r_y3": 152.96, "coord_origin": "TOPLEFT" }, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1" }, { "label": "list_item", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 50.11, "t": 164.28, "r": 286.36, "b": 227.09, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 172.3, "r_x1": 65.53, "r_y1": 172.3, "r_x2": 65.53, "r_y2": 164.28, "r_x3": 50.11, "r_y3": 164.28, "coord_origin": "TOPLEFT" }, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.85, "r_y0": 172.3, "r_x1": 286.36, "r_y1": 172.3, "r_x2": 286.36, "r_y2": 164.28, "r_x3": 67.85, "r_y3": 164.28, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 183.26, "r_x1": 286.36, "r_y1": 183.26, "r_x2": 286.36, "r_y2": 175.24, "r_x3": 70.03, "r_y3": 175.24, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 194.22, "r_x1": 286.36, "r_y1": 194.22, "r_x2": 286.36, "r_y2": 186.2, "r_x3": 70.03, "r_y3": 186.2, "coord_origin": "TOPLEFT" }, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 205.18, "r_x1": 101.33, "r_y1": 205.18, "r_x2": 101.33, "r_y2": 197.16, "r_x3": 70.03, "r_y3": 197.16, "coord_origin": "TOPLEFT" }, "text": "ages. In", "orig": "ages. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.33, "r_y0": 204.97, "r_x1": 286.36, "r_y1": 204.97, "r_x2": 286.36, "r_y2": 197.24, "r_x3": 104.33, "r_y3": 197.24, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 215.93, "r_x1": 220.49, "r_y1": 215.93, "r_x2": 220.49, "r_y2": 208.2, "r_x3": 70.03, "r_y3": 208.2, "coord_origin": "TOPLEFT" }, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.48, "r_y0": 216.14, "r_x1": 286.36, "r_y1": 216.14, "r_x2": 286.36, "r_y2": 208.12, "r_x3": 220.48, "r_y3": 208.12, "coord_origin": "TOPLEFT" }, "text": ", volume 1, pages", "orig": ", volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 227.09, "r_x1": 166.65, "r_y1": 227.09, "r_x2": 166.65, "r_y2": 219.08, "r_x3": 70.03, "r_y3": 219.08, "coord_origin": "TOPLEFT" }, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3" }, { "label": "list_item", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 50.11, "t": 230.4, "r": 286.37, "b": 271.3, "coord_origin": "TOPLEFT" }, "confidence": 0.851, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 238.42, "r_x1": 65.65, "r_y1": 238.42, "r_x2": 65.65, "r_y2": 230.4, "r_x3": 50.11, "r_y3": 230.4, "coord_origin": "TOPLEFT" }, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.98, "r_y0": 238.42, "r_x1": 286.36, "r_y1": 238.42, "r_x2": 286.36, "r_y2": 230.4, "r_x3": 67.98, "r_y3": 230.4, "coord_origin": "TOPLEFT" }, "text": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 249.38, "r_x1": 147.17, "r_y1": 249.38, "r_x2": 147.17, "r_y2": 241.36, "r_x3": 70.03, "r_y3": 241.36, "coord_origin": "TOPLEFT" }, "text": "neous documents. In", "orig": "neous documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.93, "r_y0": 249.17, "r_x1": 286.37, "r_y1": 249.17, "r_x2": 286.37, "r_y2": 241.44, "r_x3": 149.93, "r_y3": 241.44, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 260.13, "r_x1": 244.69, "r_y1": 260.13, "r_x2": 244.69, "r_y2": 252.4, "r_x3": 70.03, "r_y3": 252.4, "coord_origin": "TOPLEFT" }, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.69, "r_y0": 260.34, "r_x1": 286.36, "r_y1": 260.34, "r_x2": 286.36, "r_y2": 252.32, "r_x3": 244.69, "r_y3": 252.32, "coord_origin": "TOPLEFT" }, "text": ", pages 65-", "orig": ", pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 271.3, "r_x1": 111.37, "r_y1": 271.3, "r_x2": 111.37, "r_y2": 263.28, "r_x3": 70.03, "r_y3": 263.28, "coord_origin": "TOPLEFT" }, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 6572, 2010. 2" }, { "label": "list_item", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 274.6, "r": 286.37, "b": 326.45, "coord_origin": "TOPLEFT" }, "confidence": 0.849, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 282.62, "r_x1": 66.02, "r_y1": 282.62, "r_x2": 66.02, "r_y2": 274.6, "r_x3": 50.11, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.41, "r_y0": 282.62, "r_x1": 94.94, "r_y1": 282.62, "r_x2": 94.94, "r_y2": 274.6, "r_x3": 68.41, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 100.87, "r_y0": 282.62, "r_x1": 127.27, "r_y1": 282.62, "r_x2": 127.27, "r_y2": 274.6, "r_x3": 100.87, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.19, "r_y0": 282.62, "r_x1": 165.83, "r_y1": 282.62, "r_x2": 165.83, "r_y2": 274.6, "r_x3": 133.19, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.68, "r_y0": 282.62, "r_x1": 194.09, "r_y1": 282.62, "r_x2": 194.09, "r_y2": 274.6, "r_x3": 172.68, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.02, "r_y0": 282.62, "r_x1": 211.48, "r_y1": 282.62, "r_x2": 211.48, "r_y2": 274.6, "r_x3": 200.02, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.41, "r_y0": 282.62, "r_x1": 239.44, "r_y1": 282.62, "r_x2": 239.44, "r_y2": 274.6, "r_x3": 217.41, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 282.62, "r_x1": 264.22, "r_y1": 282.62, "r_x2": 264.22, "r_y2": 274.6, "r_x3": 246.29, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.15, "r_y0": 282.62, "r_x1": 286.36, "r_y1": 282.62, "r_x2": 286.36, "r_y2": 274.6, "r_x3": 270.15, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 293.58, "r_x1": 286.36, "r_y1": 293.58, "r_x2": 286.36, "r_y2": 285.56, "r_x3": 70.03, "r_y3": 285.56, "coord_origin": "TOPLEFT" }, "text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 304.54, "r_x1": 286.36, "r_y1": 304.54, "r_x2": 286.36, "r_y2": 296.52, "r_x3": 70.03, "r_y3": 296.52, "coord_origin": "TOPLEFT" }, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 315.5, "r_x1": 77.5, "r_y1": 315.5, "r_x2": 77.5, "r_y2": 307.48, "r_x3": 70.03, "r_y3": 307.48, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.35, "r_y0": 315.29, "r_x1": 286.37, "r_y1": 315.29, "r_x2": 286.37, "r_y2": 307.56, "r_x3": 79.35, "r_y3": 307.56, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 326.25, "r_x1": 147.57, "r_y1": 326.25, "r_x2": 147.57, "r_y2": 318.52, "r_x3": 70.03, "r_y3": 318.52, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.57, "r_y0": 326.45, "r_x1": 271.34, "r_y1": 326.45, "r_x2": 271.34, "r_y2": 318.44, "r_x3": 147.57, "r_y3": 318.44, "coord_origin": "TOPLEFT" }, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3" }, { "label": "list_item", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 50.11, "t": 329.76, "r": 286.36, "b": 381.61, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 337.78, "r_x1": 65.37, "r_y1": 337.78, "r_x2": 65.37, "r_y2": 329.76, "r_x3": 50.11, "r_y3": 329.76, "coord_origin": "TOPLEFT" }, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.66, "r_y0": 337.78, "r_x1": 286.36, "r_y1": 337.78, "r_x2": 286.36, "r_y2": 329.76, "r_x3": 67.66, "r_y3": 329.76, "coord_origin": "TOPLEFT" }, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 348.74, "r_x1": 286.36, "r_y1": 348.74, "r_x2": 286.36, "r_y2": 340.72, "r_x3": 70.03, "r_y3": 340.72, "coord_origin": "TOPLEFT" }, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 359.7, "r_x1": 198.82, "r_y1": 359.7, "r_x2": 198.82, "r_y2": 351.68, "r_x3": 70.03, "r_y3": 351.68, "coord_origin": "TOPLEFT" }, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.06, "r_y0": 359.7, "r_x1": 213.53, "r_y1": 359.7, "r_x2": 213.53, "r_y2": 351.68, "r_x3": 206.06, "r_y3": 351.68, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.02, "r_y0": 359.49, "r_x1": 286.36, "r_y1": 359.49, "r_x2": 286.36, "r_y2": 351.76, "r_x3": 217.02, "r_y3": 351.76, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.03, "r_y3": 362.72, "coord_origin": "TOPLEFT" }, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.08, "r_y0": 370.66, "r_x1": 286.36, "r_y1": 370.66, "r_x2": 286.36, "r_y2": 362.64, "r_x3": 143.08, "r_y3": 362.64, "coord_origin": "TOPLEFT" }, "text": ", KDD \u201918, pages 774-782, New York,", "orig": ", KDD \u201918, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 381.61, "r_x1": 161.16, "r_y1": 381.61, "r_x2": 161.16, "r_y2": 373.6, "r_x3": 70.03, "r_y3": 373.6, "coord_origin": "TOPLEFT" }, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[30] Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1" }, { "label": "list_item", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 50.11, "t": 384.92, "r": 286.36, "b": 458.69, "coord_origin": "TOPLEFT" }, "confidence": 0.883, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 392.94, "r_x1": 65.14, "r_y1": 392.94, "r_x2": 65.14, "r_y2": 384.92, "r_x3": 50.11, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.4, "r_y0": 392.94, "r_x1": 286.36, "r_y1": 392.94, "r_x2": 286.36, "r_y2": 384.92, "r_x3": 67.4, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 403.9, "r_x1": 286.36, "r_y1": 403.9, "r_x2": 286.36, "r_y2": 395.88, "r_x3": 70.03, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 414.86, "r_x1": 125.47, "r_y1": 414.86, "r_x2": 125.47, "r_y2": 406.84, "r_x3": 70.03, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "lia Polosukhin.", "orig": "lia Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.91, "r_y0": 414.86, "r_x1": 230.83, "r_y1": 414.86, "r_x2": 230.83, "r_y2": 406.84, "r_x3": 133.91, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "Attention is all you need.", "orig": "Attention is all you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.27, "r_y0": 414.86, "r_x1": 286.36, "r_y1": 414.86, "r_x2": 286.36, "r_y2": 406.84, "r_x3": 239.27, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "In I. Guyon,", "orig": "In I. Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 425.82, "r_x1": 78.96, "r_y1": 425.82, "r_x2": 78.96, "r_y2": 417.8, "r_x3": 70.03, "r_y3": 417.8, "coord_origin": "TOPLEFT" }, "text": "U.", "orig": "U.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.25, "r_y0": 425.82, "r_x1": 286.36, "r_y1": 425.82, "r_x2": 286.36, "r_y2": 417.8, "r_x3": 81.25, "r_y3": 417.8, "coord_origin": "TOPLEFT" }, "text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 436.77, "r_x1": 196.76, "r_y1": 436.77, "r_x2": 196.76, "r_y2": 428.76, "r_x3": 70.03, "r_y3": 428.76, "coord_origin": "TOPLEFT" }, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.2, "r_y0": 436.57, "r_x1": 286.36, "r_y1": 436.57, "r_x2": 286.36, "r_y2": 428.84, "r_x3": 200.2, "r_y3": 428.84, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 447.53, "r_x1": 189.19, "r_y1": 447.53, "r_x2": 189.19, "r_y2": 439.8, "r_x3": 70.03, "r_y3": 439.8, "coord_origin": "TOPLEFT" }, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 447.73, "r_x1": 286.36, "r_y1": 447.73, "r_x2": 286.36, "r_y2": 439.72, "r_x3": 189.2, "r_y3": 439.72, "coord_origin": "TOPLEFT" }, "text": ", pages 5998-6008. Curran", "orig": ", pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 458.69, "r_x1": 158.92, "r_y1": 458.69, "r_x2": 158.92, "r_y2": 450.68, "r_x3": 70.03, "r_y3": 450.68, "coord_origin": "TOPLEFT" }, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5" }, { "label": "list_item", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 50.11, "t": 462.0, "r": 286.36, "b": 502.89, "coord_origin": "TOPLEFT" }, "confidence": 0.843, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 470.02, "r_x1": 65.91, "r_y1": 470.02, "r_x2": 65.91, "r_y2": 462.0, "r_x3": 50.11, "r_y3": 462.0, "coord_origin": "TOPLEFT" }, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.28, "r_y0": 470.02, "r_x1": 286.36, "r_y1": 470.02, "r_x2": 286.36, "r_y2": 462.0, "r_x3": 68.28, "r_y3": 462.0, "coord_origin": "TOPLEFT" }, "text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 480.97, "r_x1": 116.28, "r_y1": 480.97, "r_x2": 116.28, "r_y2": 472.96, "r_x3": 70.03, "r_y3": 472.96, "coord_origin": "TOPLEFT" }, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.48, "r_y0": 480.97, "r_x1": 286.36, "r_y1": 480.97, "r_x2": 286.36, "r_y2": 472.96, "r_x3": 122.48, "r_y3": 472.96, "coord_origin": "TOPLEFT" }, "text": "Show and tell: A neural image caption gen-", "orig": "Show and tell: A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 491.93, "r_x1": 103.31, "r_y1": 491.93, "r_x2": 103.31, "r_y2": 483.92, "r_x3": 70.03, "r_y3": 483.92, "coord_origin": "TOPLEFT" }, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 105.52, "r_y0": 491.73, "r_x1": 286.36, "r_y1": 491.73, "r_x2": 286.36, "r_y2": 484.0, "r_x3": 105.52, "r_y3": 484.0, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 502.69, "r_x1": 212.52, "r_y1": 502.69, "r_x2": 212.52, "r_y2": 494.96, "r_x3": 70.03, "r_y3": 494.96, "coord_origin": "TOPLEFT" }, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.51, "r_y0": 502.89, "r_x1": 263.56, "r_y1": 502.89, "r_x2": 263.56, "r_y2": 494.88, "r_x3": 212.51, "r_y3": 494.88, "coord_origin": "TOPLEFT" }, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2" }, { "label": "list_item", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 50.11, "t": 506.2, "r": 286.36, "b": 547.09, "coord_origin": "TOPLEFT" }, "confidence": 0.841, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 514.22, "r_x1": 65.68, "r_y1": 514.22, "r_x2": 65.68, "r_y2": 506.2, "r_x3": 50.11, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.02, "r_y0": 514.22, "r_x1": 247.37, "r_y1": 514.22, "r_x2": 247.37, "r_y2": 506.2, "r_x3": 68.02, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.97, "r_y0": 514.22, "r_x1": 286.36, "r_y1": 514.22, "r_x2": 286.36, "r_y2": 506.2, "r_x3": 253.97, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 525.18, "r_x1": 265.62, "r_y1": 525.18, "r_x2": 265.62, "r_y2": 517.16, "r_x3": 70.03, "r_y3": 517.16, "coord_origin": "TOPLEFT" }, "text": "reconstruct syntactic structures from table images. In", "orig": "reconstruct syntactic structures from table images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 268.43, "r_y0": 524.97, "r_x1": 286.36, "r_y1": 524.97, "r_x2": 286.36, "r_y2": 517.24, "r_x3": 268.43, "r_y3": 517.24, "coord_origin": "TOPLEFT" }, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 535.93, "r_x1": 286.36, "r_y1": 535.93, "r_x2": 286.36, "r_y2": 528.2, "r_x3": 70.03, "r_y3": 528.2, "coord_origin": "TOPLEFT" }, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 546.89, "r_x1": 125.26, "r_y1": 546.89, "r_x2": 125.26, "r_y2": 539.16, "r_x3": 70.03, "r_y3": 539.16, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.25, "r_y0": 547.09, "r_x1": 240.05, "r_y1": 547.09, "r_x2": 240.05, "r_y2": 539.08, "r_x3": 125.25, "r_y3": 539.08, "coord_origin": "TOPLEFT" }, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3" }, { "label": "list_item", "id": 11, "page_no": 9, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 50.11, "t": 550.4, "r": 286.36, "b": 591.29, "coord_origin": "TOPLEFT" }, "confidence": 0.824, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 558.42, "r_x1": 66.04, "r_y1": 558.42, "r_x2": 66.04, "r_y2": 550.4, "r_x3": 50.11, "r_y3": 550.4, "coord_origin": "TOPLEFT" }, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.43, "r_y0": 558.42, "r_x1": 286.36, "r_y1": 558.42, "r_x2": 286.36, "r_y2": 550.4, "r_x3": 68.43, "r_y3": 550.4, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 569.38, "r_x1": 137.08, "r_y1": 569.38, "r_x2": 137.08, "r_y2": 561.36, "r_x3": 70.03, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99, "r_y0": 569.38, "r_x1": 172.38, "r_y1": 569.38, "r_x2": 172.38, "r_y2": 561.36, "r_x3": 145.99, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.7, "r_y0": 569.38, "r_x1": 286.36, "r_y1": 569.38, "r_x2": 286.36, "r_y2": 561.36, "r_x3": 178.7, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "A table graph reconstruction", "orig": "A table graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 580.33, "r_x1": 221.01, "r_y1": 580.33, "r_x2": 221.01, "r_y2": 572.32, "r_x3": 70.03, "r_y3": 572.32, "coord_origin": "TOPLEFT" }, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.54, "r_y0": 580.13, "r_x1": 286.36, "r_y1": 580.13, "r_x2": 286.36, "r_y2": 572.4, "r_x3": 232.54, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint", "orig": "arXiv preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 591.09, "r_x1": 135.53, "r_y1": 591.09, "r_x2": 135.53, "r_y2": 583.36, "r_x3": 70.03, "r_y3": 583.36, "coord_origin": "TOPLEFT" }, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 135.53, "r_y0": 591.29, "r_x1": 167.9, "r_y1": 591.29, "r_x2": 167.9, "r_y2": 583.28, "r_x3": 135.53, "r_y3": 583.28, "coord_origin": "TOPLEFT" }, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3" }, { "label": "list_item", "id": 10, "page_no": 9, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 50.11, "t": 594.6, "r": 286.36, "b": 635.49, "coord_origin": "TOPLEFT" }, "confidence": 0.836, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 602.62, "r_x1": 65.24, "r_y1": 602.62, "r_x2": 65.24, "r_y2": 594.6, "r_x3": 50.11, "r_y3": 594.6, "coord_origin": "TOPLEFT" }, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.51, "r_y0": 602.62, "r_x1": 286.36, "r_y1": 602.62, "r_x2": 286.36, "r_y2": 594.6, "r_x3": 67.51, "r_y3": 594.6, "coord_origin": "TOPLEFT" }, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 613.58, "r_x1": 109.11, "r_y1": 613.58, "r_x2": 109.11, "r_y2": 605.56, "r_x3": 70.03, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.23, "r_y0": 613.58, "r_x1": 271.77, "r_y1": 613.58, "r_x2": 271.77, "r_y2": 605.56, "r_x3": 116.23, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.89, "r_y0": 613.58, "r_x1": 286.36, "r_y1": 613.58, "r_x2": 286.36, "r_y2": 605.56, "r_x3": 278.89, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 624.33, "r_x1": 286.36, "r_y1": 624.33, "r_x2": 286.36, "r_y2": 616.6, "r_x3": 70.03, "r_y3": 616.6, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 635.29, "r_x1": 139.1, "r_y1": 635.29, "r_x2": 139.1, "r_y2": 627.56, "r_x3": 70.03, "r_y3": 627.56, "coord_origin": "TOPLEFT" }, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.1, "r_y0": 635.49, "r_x1": 238.96, "r_y1": 635.49, "r_x2": 238.96, "r_y2": 627.48, "r_x3": 139.1, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4" }, { "label": "list_item", "id": 12, "page_no": 9, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 50.11, "t": 638.8, "r": 286.36, "b": 690.65, "coord_origin": "TOPLEFT" }, "confidence": 0.808, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 646.82, "r_x1": 65.2, "r_y1": 646.82, "r_x2": 65.2, "r_y2": 638.8, "r_x3": 50.11, "r_y3": 638.8, "coord_origin": "TOPLEFT" }, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.47, "r_y0": 646.82, "r_x1": 286.36, "r_y1": 646.82, "r_x2": 286.36, "r_y2": 638.8, "r_x3": 67.47, "r_y3": 638.8, "coord_origin": "TOPLEFT" }, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 657.78, "r_x1": 286.36, "r_y1": 657.78, "r_x2": 286.36, "r_y2": 649.76, "r_x3": 70.03, "r_y3": 649.76, "coord_origin": "TOPLEFT" }, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 668.74, "r_x1": 286.36, "r_y1": 668.74, "r_x2": 286.36, "r_y2": 660.72, "r_x3": 70.03, "r_y3": 660.72, "coord_origin": "TOPLEFT" }, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 679.69, "r_x1": 158.46, "r_y1": 679.69, "r_x2": 158.46, "r_y2": 671.68, "r_x3": 70.03, "r_y3": 671.68, "coord_origin": "TOPLEFT" }, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.53, "r_y0": 679.49, "r_x1": 286.36, "r_y1": 679.49, "r_x2": 286.36, "r_y2": 671.76, "r_x3": 160.53, "r_y3": 671.76, "coord_origin": "TOPLEFT" }, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 690.45, "r_x1": 171.42, "r_y1": 690.45, "r_x2": 171.42, "r_y2": 682.72, "r_x3": 70.03, "r_y3": 682.72, "coord_origin": "TOPLEFT" }, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.42, "r_y0": 690.65, "r_x1": 212.76, "r_y1": 690.65, "r_x2": 212.76, "r_y2": 682.64, "r_x3": 171.42, "r_y3": 682.64, "coord_origin": "TOPLEFT" }, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3" }, { "label": "list_item", "id": 8, "page_no": 9, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 50.11, "t": 693.96, "r": 286.36, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.839, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.98, "r_x1": 66.51, "r_y1": 701.98, "r_x2": 66.51, "r_y2": 693.96, "r_x3": 50.11, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.97, "r_y0": 701.98, "r_x1": 80.99, "r_y1": 701.98, "r_x2": 80.99, "r_y2": 693.96, "r_x3": 68.97, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.06, "r_y0": 701.98, "r_x1": 114.71, "r_y1": 701.98, "r_x2": 114.71, "r_y2": 693.96, "r_x3": 89.06, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.25, "r_y0": 701.98, "r_x1": 149.15, "r_y1": 701.98, "r_x2": 149.15, "r_y2": 693.96, "r_x3": 124.25, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.22, "r_y0": 701.98, "r_x1": 209.37, "r_y1": 701.98, "r_x2": 209.37, "r_y2": 693.96, "r_x3": 157.22, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.9, "r_y0": 701.98, "r_x1": 231.85, "r_y1": 701.98, "r_x2": 231.85, "r_y2": 693.96, "r_x3": 218.9, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.93, "r_y0": 701.98, "r_x1": 269.32, "r_y1": 701.98, "r_x2": 269.32, "r_y2": 693.96, "r_x3": 239.93, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 277.39, "r_y0": 701.98, "r_x1": 286.36, "r_y1": 701.98, "r_x2": 286.36, "r_y2": 693.96, "r_x3": 277.39, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 712.94, "r_x1": 286.36, "r_y1": 712.94, "r_x2": 286.36, "r_y2": 704.92, "r_x3": 70.03, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "meno Yepes. Image-based table recognition: Data, model,", "orig": "meno Yepes. Image-based table recognition: Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model," }, { "label": "list_item", "id": 14, "page_no": 9, "cluster": { "id": 14, "label": "list_item", "bbox": { "l": 328.78, "t": 75.88, "r": 545.11, "b": 116.78, "coord_origin": "TOPLEFT" }, "confidence": 0.756, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 83.9, "r_x1": 545.11, "r_y1": 83.9, "r_x2": 545.11, "r_y2": 75.88, "r_x3": 328.78, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 94.86, "r_x1": 472.31, "r_y1": 94.86, "r_x2": 472.31, "r_y2": 86.84, "r_x3": 328.78, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.89, "r_y0": 94.65, "r_x1": 545.11, "r_y1": 94.65, "r_x2": 545.11, "r_y2": 86.92, "r_x3": 475.89, "r_y3": 86.92, "coord_origin": "TOPLEFT" }, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 105.61, "r_x1": 371.93, "r_y1": 105.61, "r_x2": 371.93, "r_y2": 97.88, "r_x3": 328.78, "r_y3": 97.88, "coord_origin": "TOPLEFT" }, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.93, "r_y0": 105.82, "r_x1": 545.11, "r_y1": 105.82, "r_x2": 545.11, "r_y2": 97.8, "r_x3": 371.93, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": ", pages 564-580, Cham, 2020. Springer Interna-", "orig": ", pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 116.78, "r_x1": 417.7, "r_y1": 116.78, "r_x2": 417.7, "r_y2": 108.76, "r_x3": 328.78, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7" }, { "label": "list_item", "id": 9, "page_no": 9, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 120.71, "r": 545.11, "b": 161.61, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 128.73, "r_x1": 324.33, "r_y1": 128.73, "r_x2": 324.33, "r_y2": 120.71, "r_x3": 308.86, "r_y3": 120.71, "coord_origin": "TOPLEFT" }, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.65, "r_y0": 128.73, "r_x1": 545.11, "r_y1": 128.73, "r_x2": 545.11, "r_y2": 120.71, "r_x3": 326.65, "r_y3": 120.71, "coord_origin": "TOPLEFT" }, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 139.69, "r_x1": 545.11, "r_y1": 139.69, "r_x2": 545.11, "r_y2": 131.67, "r_x3": 328.78, "r_y3": 131.67, "coord_origin": "TOPLEFT" }, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 150.44, "r_x1": 545.11, "r_y1": 150.44, "r_x2": 545.11, "r_y2": 142.71, "r_x3": 328.78, "r_y3": 142.71, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 161.4, "r_x1": 406.32, "r_y1": 161.4, "r_x2": 406.32, "r_y2": 153.67, "r_x3": 328.78, "r_y3": 153.67, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32, "r_y0": 161.61, "r_x1": 506.18, "r_y1": 161.61, "r_x2": 506.18, "r_y2": 153.59, "r_x3": 406.32, "r_y3": 153.59, "coord_origin": "TOPLEFT" }, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1" }, { "label": "page_footer", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.907, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" } ], "body": [ { "label": "text", "id": 15, "page_no": 9, "cluster": { "id": 15, "label": "text", "bbox": { "l": 70.03, "t": 75.88, "r": 286.36, "b": 94.86, "coord_origin": "TOPLEFT" }, "confidence": 0.689, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 83.69, "r_x1": 223.58, "r_y1": 83.69, "r_x2": 223.58, "r_y2": 75.96, "r_x3": 70.03, "r_y3": 75.96, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.58, "r_y0": 83.9, "r_x1": 286.36, "r_y1": 83.9, "r_x2": 286.36, "r_y2": 75.88, "r_x3": 223.58, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": ", pages 658-666,", "orig": ", pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 94.86, "r_x1": 97.92, "r_y1": 94.86, "r_x2": 97.92, "r_y2": 86.84, "r_x3": 70.03, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6" }, { "label": "list_item", "id": 13, "page_no": 9, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 98.17, "r": 286.37, "b": 160.98, "coord_origin": "TOPLEFT" }, "confidence": 0.772, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 106.18, "r_x1": 65.53, "r_y1": 106.18, "r_x2": 65.53, "r_y2": 98.17, "r_x3": 50.11, "r_y3": 98.17, "coord_origin": "TOPLEFT" }, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.85, "r_y0": 106.18, "r_x1": 286.36, "r_y1": 106.18, "r_x2": 286.36, "r_y2": 98.17, "r_x3": 67.85, "r_y3": 98.17, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 117.14, "r_x1": 286.36, "r_y1": 117.14, "r_x2": 286.36, "r_y2": 109.12, "r_x3": 70.03, "r_y3": 109.12, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 128.1, "r_x1": 286.36, "r_y1": 128.1, "r_x2": 286.36, "r_y2": 120.08, "r_x3": 70.03, "r_y3": 120.08, "coord_origin": "TOPLEFT" }, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 139.06, "r_x1": 77.5, "r_y1": 139.06, "r_x2": 77.5, "r_y2": 131.04, "r_x3": 70.03, "r_y3": 131.04, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 80.56, "r_y0": 138.85, "r_x1": 286.37, "r_y1": 138.85, "r_x2": 286.37, "r_y2": 131.12, "r_x3": 80.56, "r_y3": 131.12, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 149.81, "r_x1": 195.23, "r_y1": 149.81, "r_x2": 195.23, "r_y2": 142.08, "r_x3": 70.03, "r_y3": 142.08, "coord_origin": "TOPLEFT" }, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.23, "r_y0": 150.02, "r_x1": 286.37, "r_y1": 150.02, "r_x2": 286.37, "r_y2": 142.0, "r_x3": 195.23, "r_y3": 142.0, "coord_origin": "TOPLEFT" }, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 160.98, "r_x1": 120.33, "r_y1": 160.98, "r_x2": 120.33, "r_y2": 152.96, "r_x3": 70.03, "r_y3": 152.96, "coord_origin": "TOPLEFT" }, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1" }, { "label": "list_item", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 50.11, "t": 164.28, "r": 286.36, "b": 227.09, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 172.3, "r_x1": 65.53, "r_y1": 172.3, "r_x2": 65.53, "r_y2": 164.28, "r_x3": 50.11, "r_y3": 164.28, "coord_origin": "TOPLEFT" }, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.85, "r_y0": 172.3, "r_x1": 286.36, "r_y1": 172.3, "r_x2": 286.36, "r_y2": 164.28, "r_x3": 67.85, "r_y3": 164.28, "coord_origin": "TOPLEFT" }, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 183.26, "r_x1": 286.36, "r_y1": 183.26, "r_x2": 286.36, "r_y2": 175.24, "r_x3": 70.03, "r_y3": 175.24, "coord_origin": "TOPLEFT" }, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 194.22, "r_x1": 286.36, "r_y1": 194.22, "r_x2": 286.36, "r_y2": 186.2, "r_x3": 70.03, "r_y3": 186.2, "coord_origin": "TOPLEFT" }, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 205.18, "r_x1": 101.33, "r_y1": 205.18, "r_x2": 101.33, "r_y2": 197.16, "r_x3": 70.03, "r_y3": 197.16, "coord_origin": "TOPLEFT" }, "text": "ages. In", "orig": "ages. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 104.33, "r_y0": 204.97, "r_x1": 286.36, "r_y1": 204.97, "r_x2": 286.36, "r_y2": 197.24, "r_x3": 104.33, "r_y3": 197.24, "coord_origin": "TOPLEFT" }, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 215.93, "r_x1": 220.49, "r_y1": 215.93, "r_x2": 220.49, "r_y2": 208.2, "r_x3": 70.03, "r_y3": 208.2, "coord_origin": "TOPLEFT" }, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.48, "r_y0": 216.14, "r_x1": 286.36, "r_y1": 216.14, "r_x2": 286.36, "r_y2": 208.12, "r_x3": 220.48, "r_y3": 208.12, "coord_origin": "TOPLEFT" }, "text": ", volume 1, pages", "orig": ", volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 227.09, "r_x1": 166.65, "r_y1": 227.09, "r_x2": 166.65, "r_y2": 219.08, "r_x3": 70.03, "r_y3": 219.08, "coord_origin": "TOPLEFT" }, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3" }, { "label": "list_item", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 50.11, "t": 230.4, "r": 286.37, "b": 271.3, "coord_origin": "TOPLEFT" }, "confidence": 0.851, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 238.42, "r_x1": 65.65, "r_y1": 238.42, "r_x2": 65.65, "r_y2": 230.4, "r_x3": 50.11, "r_y3": 230.4, "coord_origin": "TOPLEFT" }, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.98, "r_y0": 238.42, "r_x1": 286.36, "r_y1": 238.42, "r_x2": 286.36, "r_y2": 230.4, "r_x3": 67.98, "r_y3": 230.4, "coord_origin": "TOPLEFT" }, "text": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 249.38, "r_x1": 147.17, "r_y1": 249.38, "r_x2": 147.17, "r_y2": 241.36, "r_x3": 70.03, "r_y3": 241.36, "coord_origin": "TOPLEFT" }, "text": "neous documents. In", "orig": "neous documents. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.93, "r_y0": 249.17, "r_x1": 286.37, "r_y1": 249.17, "r_x2": 286.37, "r_y2": 241.44, "r_x3": 149.93, "r_y3": 241.44, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 260.13, "r_x1": 244.69, "r_y1": 260.13, "r_x2": 244.69, "r_y2": 252.4, "r_x3": 70.03, "r_y3": 252.4, "coord_origin": "TOPLEFT" }, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.69, "r_y0": 260.34, "r_x1": 286.36, "r_y1": 260.34, "r_x2": 286.36, "r_y2": 252.32, "r_x3": 244.69, "r_y3": 252.32, "coord_origin": "TOPLEFT" }, "text": ", pages 65-", "orig": ", pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 271.3, "r_x1": 111.37, "r_y1": 271.3, "r_x2": 111.37, "r_y2": 263.28, "r_x3": 70.03, "r_y3": 263.28, "coord_origin": "TOPLEFT" }, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 6572, 2010. 2" }, { "label": "list_item", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 274.6, "r": 286.37, "b": 326.45, "coord_origin": "TOPLEFT" }, "confidence": 0.849, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 282.62, "r_x1": 66.02, "r_y1": 282.62, "r_x2": 66.02, "r_y2": 274.6, "r_x3": 50.11, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.41, "r_y0": 282.62, "r_x1": 94.94, "r_y1": 282.62, "r_x2": 94.94, "r_y2": 274.6, "r_x3": 68.41, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 100.87, "r_y0": 282.62, "r_x1": 127.27, "r_y1": 282.62, "r_x2": 127.27, "r_y2": 274.6, "r_x3": 100.87, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.19, "r_y0": 282.62, "r_x1": 165.83, "r_y1": 282.62, "r_x2": 165.83, "r_y2": 274.6, "r_x3": 133.19, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.68, "r_y0": 282.62, "r_x1": 194.09, "r_y1": 282.62, "r_x2": 194.09, "r_y2": 274.6, "r_x3": 172.68, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.02, "r_y0": 282.62, "r_x1": 211.48, "r_y1": 282.62, "r_x2": 211.48, "r_y2": 274.6, "r_x3": 200.02, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.41, "r_y0": 282.62, "r_x1": 239.44, "r_y1": 282.62, "r_x2": 239.44, "r_y2": 274.6, "r_x3": 217.41, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.29, "r_y0": 282.62, "r_x1": 264.22, "r_y1": 282.62, "r_x2": 264.22, "r_y2": 274.6, "r_x3": 246.29, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.15, "r_y0": 282.62, "r_x1": 286.36, "r_y1": 282.62, "r_x2": 286.36, "r_y2": 274.6, "r_x3": 270.15, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 293.58, "r_x1": 286.36, "r_y1": 293.58, "r_x2": 286.36, "r_y2": 285.56, "r_x3": 70.03, "r_y3": 285.56, "coord_origin": "TOPLEFT" }, "text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 304.54, "r_x1": 286.36, "r_y1": 304.54, "r_x2": 286.36, "r_y2": 296.52, "r_x3": 70.03, "r_y3": 296.52, "coord_origin": "TOPLEFT" }, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 315.5, "r_x1": 77.5, "r_y1": 315.5, "r_x2": 77.5, "r_y2": 307.48, "r_x3": 70.03, "r_y3": 307.48, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 79.35, "r_y0": 315.29, "r_x1": 286.37, "r_y1": 315.29, "r_x2": 286.37, "r_y2": 307.56, "r_x3": 79.35, "r_y3": 307.56, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 326.25, "r_x1": 147.57, "r_y1": 326.25, "r_x2": 147.57, "r_y2": 318.52, "r_x3": 70.03, "r_y3": 318.52, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.57, "r_y0": 326.45, "r_x1": 271.34, "r_y1": 326.45, "r_x2": 271.34, "r_y2": 318.44, "r_x3": 147.57, "r_y3": 318.44, "coord_origin": "TOPLEFT" }, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3" }, { "label": "list_item", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 50.11, "t": 329.76, "r": 286.36, "b": 381.61, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 337.78, "r_x1": 65.37, "r_y1": 337.78, "r_x2": 65.37, "r_y2": 329.76, "r_x3": 50.11, "r_y3": 329.76, "coord_origin": "TOPLEFT" }, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.66, "r_y0": 337.78, "r_x1": 286.36, "r_y1": 337.78, "r_x2": 286.36, "r_y2": 329.76, "r_x3": 67.66, "r_y3": 329.76, "coord_origin": "TOPLEFT" }, "text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 348.74, "r_x1": 286.36, "r_y1": 348.74, "r_x2": 286.36, "r_y2": 340.72, "r_x3": 70.03, "r_y3": 340.72, "coord_origin": "TOPLEFT" }, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 359.7, "r_x1": 198.82, "r_y1": 359.7, "r_x2": 198.82, "r_y2": 351.68, "r_x3": 70.03, "r_y3": 351.68, "coord_origin": "TOPLEFT" }, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.06, "r_y0": 359.7, "r_x1": 213.53, "r_y1": 359.7, "r_x2": 213.53, "r_y2": 351.68, "r_x3": 206.06, "r_y3": 351.68, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.02, "r_y0": 359.49, "r_x1": 286.36, "r_y1": 359.49, "r_x2": 286.36, "r_y2": 351.76, "r_x3": 217.02, "r_y3": 351.76, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.03, "r_y3": 362.72, "coord_origin": "TOPLEFT" }, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 143.08, "r_y0": 370.66, "r_x1": 286.36, "r_y1": 370.66, "r_x2": 286.36, "r_y2": 362.64, "r_x3": 143.08, "r_y3": 362.64, "coord_origin": "TOPLEFT" }, "text": ", KDD \u201918, pages 774-782, New York,", "orig": ", KDD \u201918, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 381.61, "r_x1": 161.16, "r_y1": 381.61, "r_x2": 161.16, "r_y2": 373.6, "r_x3": 70.03, "r_y3": 373.6, "coord_origin": "TOPLEFT" }, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[30] Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1" }, { "label": "list_item", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 50.11, "t": 384.92, "r": 286.36, "b": 458.69, "coord_origin": "TOPLEFT" }, "confidence": 0.883, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 392.94, "r_x1": 65.14, "r_y1": 392.94, "r_x2": 65.14, "r_y2": 384.92, "r_x3": 50.11, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.4, "r_y0": 392.94, "r_x1": 286.36, "r_y1": 392.94, "r_x2": 286.36, "r_y2": 384.92, "r_x3": 67.4, "r_y3": 384.92, "coord_origin": "TOPLEFT" }, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 403.9, "r_x1": 286.36, "r_y1": 403.9, "r_x2": 286.36, "r_y2": 395.88, "r_x3": 70.03, "r_y3": 395.88, "coord_origin": "TOPLEFT" }, "text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 414.86, "r_x1": 125.47, "r_y1": 414.86, "r_x2": 125.47, "r_y2": 406.84, "r_x3": 70.03, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "lia Polosukhin.", "orig": "lia Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 133.91, "r_y0": 414.86, "r_x1": 230.83, "r_y1": 414.86, "r_x2": 230.83, "r_y2": 406.84, "r_x3": 133.91, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "Attention is all you need.", "orig": "Attention is all you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.27, "r_y0": 414.86, "r_x1": 286.36, "r_y1": 414.86, "r_x2": 286.36, "r_y2": 406.84, "r_x3": 239.27, "r_y3": 406.84, "coord_origin": "TOPLEFT" }, "text": "In I. Guyon,", "orig": "In I. Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 425.82, "r_x1": 78.96, "r_y1": 425.82, "r_x2": 78.96, "r_y2": 417.8, "r_x3": 70.03, "r_y3": 417.8, "coord_origin": "TOPLEFT" }, "text": "U.", "orig": "U.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 81.25, "r_y0": 425.82, "r_x1": 286.36, "r_y1": 425.82, "r_x2": 286.36, "r_y2": 417.8, "r_x3": 81.25, "r_y3": 417.8, "coord_origin": "TOPLEFT" }, "text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 436.77, "r_x1": 196.76, "r_y1": 436.77, "r_x2": 196.76, "r_y2": 428.76, "r_x3": 70.03, "r_y3": 428.76, "coord_origin": "TOPLEFT" }, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.2, "r_y0": 436.57, "r_x1": 286.36, "r_y1": 436.57, "r_x2": 286.36, "r_y2": 428.84, "r_x3": 200.2, "r_y3": 428.84, "coord_origin": "TOPLEFT" }, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 447.53, "r_x1": 189.19, "r_y1": 447.53, "r_x2": 189.19, "r_y2": 439.8, "r_x3": 70.03, "r_y3": 439.8, "coord_origin": "TOPLEFT" }, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 447.73, "r_x1": 286.36, "r_y1": 447.73, "r_x2": 286.36, "r_y2": 439.72, "r_x3": 189.2, "r_y3": 439.72, "coord_origin": "TOPLEFT" }, "text": ", pages 5998-6008. Curran", "orig": ", pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 458.69, "r_x1": 158.92, "r_y1": 458.69, "r_x2": 158.92, "r_y2": 450.68, "r_x3": 70.03, "r_y3": 450.68, "coord_origin": "TOPLEFT" }, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5" }, { "label": "list_item", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 50.11, "t": 462.0, "r": 286.36, "b": 502.89, "coord_origin": "TOPLEFT" }, "confidence": 0.843, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 470.02, "r_x1": 65.91, "r_y1": 470.02, "r_x2": 65.91, "r_y2": 462.0, "r_x3": 50.11, "r_y3": 462.0, "coord_origin": "TOPLEFT" }, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.28, "r_y0": 470.02, "r_x1": 286.36, "r_y1": 470.02, "r_x2": 286.36, "r_y2": 462.0, "r_x3": 68.28, "r_y3": 462.0, "coord_origin": "TOPLEFT" }, "text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 480.97, "r_x1": 116.28, "r_y1": 480.97, "r_x2": 116.28, "r_y2": 472.96, "r_x3": 70.03, "r_y3": 472.96, "coord_origin": "TOPLEFT" }, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.48, "r_y0": 480.97, "r_x1": 286.36, "r_y1": 480.97, "r_x2": 286.36, "r_y2": 472.96, "r_x3": 122.48, "r_y3": 472.96, "coord_origin": "TOPLEFT" }, "text": "Show and tell: A neural image caption gen-", "orig": "Show and tell: A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 491.93, "r_x1": 103.31, "r_y1": 491.93, "r_x2": 103.31, "r_y2": 483.92, "r_x3": 70.03, "r_y3": 483.92, "coord_origin": "TOPLEFT" }, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 105.52, "r_y0": 491.73, "r_x1": 286.36, "r_y1": 491.73, "r_x2": 286.36, "r_y2": 484.0, "r_x3": 105.52, "r_y3": 484.0, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 502.69, "r_x1": 212.52, "r_y1": 502.69, "r_x2": 212.52, "r_y2": 494.96, "r_x3": 70.03, "r_y3": 494.96, "coord_origin": "TOPLEFT" }, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.51, "r_y0": 502.89, "r_x1": 263.56, "r_y1": 502.89, "r_x2": 263.56, "r_y2": 494.88, "r_x3": 212.51, "r_y3": 494.88, "coord_origin": "TOPLEFT" }, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2" }, { "label": "list_item", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 50.11, "t": 506.2, "r": 286.36, "b": 547.09, "coord_origin": "TOPLEFT" }, "confidence": 0.841, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 514.22, "r_x1": 65.68, "r_y1": 514.22, "r_x2": 65.68, "r_y2": 506.2, "r_x3": 50.11, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.02, "r_y0": 514.22, "r_x1": 247.37, "r_y1": 514.22, "r_x2": 247.37, "r_y2": 506.2, "r_x3": 68.02, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.97, "r_y0": 514.22, "r_x1": 286.36, "r_y1": 514.22, "r_x2": 286.36, "r_y2": 506.2, "r_x3": 253.97, "r_y3": 506.2, "coord_origin": "TOPLEFT" }, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 525.18, "r_x1": 265.62, "r_y1": 525.18, "r_x2": 265.62, "r_y2": 517.16, "r_x3": 70.03, "r_y3": 517.16, "coord_origin": "TOPLEFT" }, "text": "reconstruct syntactic structures from table images. In", "orig": "reconstruct syntactic structures from table images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 268.43, "r_y0": 524.97, "r_x1": 286.36, "r_y1": 524.97, "r_x2": 286.36, "r_y2": 517.24, "r_x3": 268.43, "r_y3": 517.24, "coord_origin": "TOPLEFT" }, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 535.93, "r_x1": 286.36, "r_y1": 535.93, "r_x2": 286.36, "r_y2": 528.2, "r_x3": 70.03, "r_y3": 528.2, "coord_origin": "TOPLEFT" }, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 546.89, "r_x1": 125.26, "r_y1": 546.89, "r_x2": 125.26, "r_y2": 539.16, "r_x3": 70.03, "r_y3": 539.16, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.25, "r_y0": 547.09, "r_x1": 240.05, "r_y1": 547.09, "r_x2": 240.05, "r_y2": 539.08, "r_x3": 125.25, "r_y3": 539.08, "coord_origin": "TOPLEFT" }, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3" }, { "label": "list_item", "id": 11, "page_no": 9, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 50.11, "t": 550.4, "r": 286.36, "b": 591.29, "coord_origin": "TOPLEFT" }, "confidence": 0.824, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 558.42, "r_x1": 66.04, "r_y1": 558.42, "r_x2": 66.04, "r_y2": 550.4, "r_x3": 50.11, "r_y3": 550.4, "coord_origin": "TOPLEFT" }, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.43, "r_y0": 558.42, "r_x1": 286.36, "r_y1": 558.42, "r_x2": 286.36, "r_y2": 550.4, "r_x3": 68.43, "r_y3": 550.4, "coord_origin": "TOPLEFT" }, "text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 569.38, "r_x1": 137.08, "r_y1": 569.38, "r_x2": 137.08, "r_y2": 561.36, "r_x3": 70.03, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.99, "r_y0": 569.38, "r_x1": 172.38, "r_y1": 569.38, "r_x2": 172.38, "r_y2": 561.36, "r_x3": 145.99, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.7, "r_y0": 569.38, "r_x1": 286.36, "r_y1": 569.38, "r_x2": 286.36, "r_y2": 561.36, "r_x3": 178.7, "r_y3": 561.36, "coord_origin": "TOPLEFT" }, "text": "A table graph reconstruction", "orig": "A table graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 580.33, "r_x1": 221.01, "r_y1": 580.33, "r_x2": 221.01, "r_y2": 572.32, "r_x3": 70.03, "r_y3": 572.32, "coord_origin": "TOPLEFT" }, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.54, "r_y0": 580.13, "r_x1": 286.36, "r_y1": 580.13, "r_x2": 286.36, "r_y2": 572.4, "r_x3": 232.54, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "arXiv preprint", "orig": "arXiv preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 591.09, "r_x1": 135.53, "r_y1": 591.09, "r_x2": 135.53, "r_y2": 583.36, "r_x3": 70.03, "r_y3": 583.36, "coord_origin": "TOPLEFT" }, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 135.53, "r_y0": 591.29, "r_x1": 167.9, "r_y1": 591.29, "r_x2": 167.9, "r_y2": 583.28, "r_x3": 135.53, "r_y3": 583.28, "coord_origin": "TOPLEFT" }, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3" }, { "label": "list_item", "id": 10, "page_no": 9, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 50.11, "t": 594.6, "r": 286.36, "b": 635.49, "coord_origin": "TOPLEFT" }, "confidence": 0.836, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 602.62, "r_x1": 65.24, "r_y1": 602.62, "r_x2": 65.24, "r_y2": 594.6, "r_x3": 50.11, "r_y3": 594.6, "coord_origin": "TOPLEFT" }, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.51, "r_y0": 602.62, "r_x1": 286.36, "r_y1": 602.62, "r_x2": 286.36, "r_y2": 594.6, "r_x3": 67.51, "r_y3": 594.6, "coord_origin": "TOPLEFT" }, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 613.58, "r_x1": 109.11, "r_y1": 613.58, "r_x2": 109.11, "r_y2": 605.56, "r_x3": 70.03, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.23, "r_y0": 613.58, "r_x1": 271.77, "r_y1": 613.58, "r_x2": 271.77, "r_y2": 605.56, "r_x3": 116.23, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.89, "r_y0": 613.58, "r_x1": 286.36, "r_y1": 613.58, "r_x2": 286.36, "r_y2": 605.56, "r_x3": 278.89, "r_y3": 605.56, "coord_origin": "TOPLEFT" }, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 624.33, "r_x1": 286.36, "r_y1": 624.33, "r_x2": 286.36, "r_y2": 616.6, "r_x3": 70.03, "r_y3": 616.6, "coord_origin": "TOPLEFT" }, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 635.29, "r_x1": 139.1, "r_y1": 635.29, "r_x2": 139.1, "r_y2": 627.56, "r_x3": 70.03, "r_y3": 627.56, "coord_origin": "TOPLEFT" }, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.1, "r_y0": 635.49, "r_x1": 238.96, "r_y1": 635.49, "r_x2": 238.96, "r_y2": 627.48, "r_x3": 139.1, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4" }, { "label": "list_item", "id": 12, "page_no": 9, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 50.11, "t": 638.8, "r": 286.36, "b": 690.65, "coord_origin": "TOPLEFT" }, "confidence": 0.808, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 646.82, "r_x1": 65.2, "r_y1": 646.82, "r_x2": 65.2, "r_y2": 638.8, "r_x3": 50.11, "r_y3": 638.8, "coord_origin": "TOPLEFT" }, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.47, "r_y0": 646.82, "r_x1": 286.36, "r_y1": 646.82, "r_x2": 286.36, "r_y2": 638.8, "r_x3": 67.47, "r_y3": 638.8, "coord_origin": "TOPLEFT" }, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 657.78, "r_x1": 286.36, "r_y1": 657.78, "r_x2": 286.36, "r_y2": 649.76, "r_x3": 70.03, "r_y3": 649.76, "coord_origin": "TOPLEFT" }, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 668.74, "r_x1": 286.36, "r_y1": 668.74, "r_x2": 286.36, "r_y2": 660.72, "r_x3": 70.03, "r_y3": 660.72, "coord_origin": "TOPLEFT" }, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 679.69, "r_x1": 158.46, "r_y1": 679.69, "r_x2": 158.46, "r_y2": 671.68, "r_x3": 70.03, "r_y3": 671.68, "coord_origin": "TOPLEFT" }, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.53, "r_y0": 679.49, "r_x1": 286.36, "r_y1": 679.49, "r_x2": 286.36, "r_y2": 671.76, "r_x3": 160.53, "r_y3": 671.76, "coord_origin": "TOPLEFT" }, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 690.45, "r_x1": 171.42, "r_y1": 690.45, "r_x2": 171.42, "r_y2": 682.72, "r_x3": 70.03, "r_y3": 682.72, "coord_origin": "TOPLEFT" }, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.42, "r_y0": 690.65, "r_x1": 212.76, "r_y1": 690.65, "r_x2": 212.76, "r_y2": 682.64, "r_x3": 171.42, "r_y3": 682.64, "coord_origin": "TOPLEFT" }, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3" }, { "label": "list_item", "id": 8, "page_no": 9, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 50.11, "t": 693.96, "r": 286.36, "b": 712.94, "coord_origin": "TOPLEFT" }, "confidence": 0.839, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 701.98, "r_x1": 66.51, "r_y1": 701.98, "r_x2": 66.51, "r_y2": 693.96, "r_x3": 50.11, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 68.97, "r_y0": 701.98, "r_x1": 80.99, "r_y1": 701.98, "r_x2": 80.99, "r_y2": 693.96, "r_x3": 68.97, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 89.06, "r_y0": 701.98, "r_x1": 114.71, "r_y1": 701.98, "r_x2": 114.71, "r_y2": 693.96, "r_x3": 89.06, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 124.25, "r_y0": 701.98, "r_x1": 149.15, "r_y1": 701.98, "r_x2": 149.15, "r_y2": 693.96, "r_x3": 124.25, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 157.22, "r_y0": 701.98, "r_x1": 209.37, "r_y1": 701.98, "r_x2": 209.37, "r_y2": 693.96, "r_x3": 157.22, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 218.9, "r_y0": 701.98, "r_x1": 231.85, "r_y1": 701.98, "r_x2": 231.85, "r_y2": 693.96, "r_x3": 218.9, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.93, "r_y0": 701.98, "r_x1": 269.32, "r_y1": 701.98, "r_x2": 269.32, "r_y2": 693.96, "r_x3": 239.93, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 277.39, "r_y0": 701.98, "r_x1": 286.36, "r_y1": 701.98, "r_x2": 286.36, "r_y2": 693.96, "r_x3": 277.39, "r_y3": 693.96, "coord_origin": "TOPLEFT" }, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.03, "r_y0": 712.94, "r_x1": 286.36, "r_y1": 712.94, "r_x2": 286.36, "r_y2": 704.92, "r_x3": 70.03, "r_y3": 704.92, "coord_origin": "TOPLEFT" }, "text": "meno Yepes. Image-based table recognition: Data, model,", "orig": "meno Yepes. Image-based table recognition: Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model," }, { "label": "list_item", "id": 14, "page_no": 9, "cluster": { "id": 14, "label": "list_item", "bbox": { "l": 328.78, "t": 75.88, "r": 545.11, "b": 116.78, "coord_origin": "TOPLEFT" }, "confidence": 0.756, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 83.9, "r_x1": 545.11, "r_y1": 83.9, "r_x2": 545.11, "r_y2": 75.88, "r_x3": 328.78, "r_y3": 75.88, "coord_origin": "TOPLEFT" }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 94.86, "r_x1": 472.31, "r_y1": 94.86, "r_x2": 472.31, "r_y2": 86.84, "r_x3": 328.78, "r_y3": 86.84, "coord_origin": "TOPLEFT" }, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.89, "r_y0": 94.65, "r_x1": 545.11, "r_y1": 94.65, "r_x2": 545.11, "r_y2": 86.92, "r_x3": 475.89, "r_y3": 86.92, "coord_origin": "TOPLEFT" }, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 105.61, "r_x1": 371.93, "r_y1": 105.61, "r_x2": 371.93, "r_y2": 97.88, "r_x3": 328.78, "r_y3": 97.88, "coord_origin": "TOPLEFT" }, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 371.93, "r_y0": 105.82, "r_x1": 545.11, "r_y1": 105.82, "r_x2": 545.11, "r_y2": 97.8, "r_x3": 371.93, "r_y3": 97.8, "coord_origin": "TOPLEFT" }, "text": ", pages 564-580, Cham, 2020. Springer Interna-", "orig": ", pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 116.78, "r_x1": 417.7, "r_y1": 116.78, "r_x2": 417.7, "r_y2": 108.76, "r_x3": 328.78, "r_y3": 108.76, "coord_origin": "TOPLEFT" }, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7" }, { "label": "list_item", "id": 9, "page_no": 9, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 120.71, "r": 545.11, "b": 161.61, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 128.73, "r_x1": 324.33, "r_y1": 128.73, "r_x2": 324.33, "r_y2": 120.71, "r_x3": 308.86, "r_y3": 120.71, "coord_origin": "TOPLEFT" }, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.65, "r_y0": 128.73, "r_x1": 545.11, "r_y1": 128.73, "r_x2": 545.11, "r_y2": 120.71, "r_x3": 326.65, "r_y3": 120.71, "coord_origin": "TOPLEFT" }, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 139.69, "r_x1": 545.11, "r_y1": 139.69, "r_x2": 545.11, "r_y2": 131.67, "r_x3": 328.78, "r_y3": 131.67, "coord_origin": "TOPLEFT" }, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 150.44, "r_x1": 545.11, "r_y1": 150.44, "r_x2": 545.11, "r_y2": 142.71, "r_x3": 328.78, "r_y3": 142.71, "coord_origin": "TOPLEFT" }, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 328.78, "r_y0": 161.4, "r_x1": 406.32, "r_y1": 161.4, "r_x2": 406.32, "r_y2": 153.67, "r_x3": 328.78, "r_y3": 153.67, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.32, "r_y0": 161.61, "r_x1": 506.18, "r_y1": 161.61, "r_x2": 506.18, "r_y2": 153.59, "r_x3": 406.32, "r_y3": 153.59, "coord_origin": "TOPLEFT" }, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1" } ], "headers": [ { "label": "page_footer", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.907, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" } ] } }, { "page_no": 10, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.84, "r_y0": 121.32, "r_x1": 465.38, "r_y1": 121.32, "r_x2": 465.38, "r_y2": 110.57, "r_x3": 132.84, "r_y3": 110.57, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.18, "r_y0": 135.53, "r_x1": 375.04, "r_y1": 135.53, "r_x2": 375.04, "r_y2": 122.26, "r_x3": 220.18, "r_y3": 122.26, "coord_origin": "TOPLEFT" }, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 171.91, "r_x1": 57.09, "r_y1": 171.91, "r_x2": 57.09, "r_y2": 161.16, "r_x3": 50.11, "r_y3": 161.16, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.39, "r_y0": 171.91, "r_x1": 175.96, "r_y1": 171.91, "r_x2": 175.96, "r_y2": 161.16, "r_x3": 66.39, "r_y3": 161.16, "coord_origin": "TOPLEFT" }, "text": "Details on the datasets", "orig": "Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 190.83, "r_x1": 64.21, "r_y1": 190.83, "r_x2": 64.21, "r_y2": 180.98, "r_x3": 50.11, "r_y3": 180.98, "coord_origin": "TOPLEFT" }, "text": "1.1.", "orig": "1.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.61, "r_y0": 190.83, "r_x1": 150.36, "r_y1": 190.83, "r_x2": 150.36, "r_y2": 180.98, "r_x3": 73.61, "r_y3": 180.98, "coord_origin": "TOPLEFT" }, "text": "Data preparation", "orig": "Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 208.83, "r_x1": 286.36, "r_y1": 208.83, "r_x2": 286.36, "r_y2": 199.92, "r_x3": 62.07, "r_y3": 199.92, "coord_origin": "TOPLEFT" }, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 220.78, "r_x1": 286.37, "r_y1": 220.78, "r_x2": 286.37, "r_y2": 211.88, "r_x3": 50.11, "r_y3": 211.88, "coord_origin": "TOPLEFT" }, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 232.74, "r_x1": 286.37, "r_y1": 232.74, "r_x2": 286.37, "r_y2": 223.83, "r_x3": 50.11, "r_y3": 223.83, "coord_origin": "TOPLEFT" }, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 244.69, "r_x1": 286.37, "r_y1": 244.69, "r_x2": 286.37, "r_y2": 235.79, "r_x3": 50.11, "r_y3": 235.79, "coord_origin": "TOPLEFT" }, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 256.65, "r_x1": 286.37, "r_y1": 256.65, "r_x2": 286.37, "r_y2": 247.74, "r_x3": 50.11, "r_y3": 247.74, "coord_origin": "TOPLEFT" }, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 268.6, "r_x1": 286.37, "r_y1": 268.6, "r_x2": 286.37, "r_y2": 259.7, "r_x3": 50.11, "r_y3": 259.7, "coord_origin": "TOPLEFT" }, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 280.56, "r_x1": 286.37, "r_y1": 280.56, "r_x2": 286.37, "r_y2": 271.65, "r_x3": 50.11, "r_y3": 271.65, "coord_origin": "TOPLEFT" }, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 292.51, "r_x1": 286.37, "r_y1": 292.51, "r_x2": 286.37, "r_y2": 283.61, "r_x3": 50.11, "r_y3": 283.61, "coord_origin": "TOPLEFT" }, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 304.47, "r_x1": 286.37, "r_y1": 304.47, "r_x2": 286.37, "r_y2": 295.56, "r_x3": 50.11, "r_y3": 295.56, "coord_origin": "TOPLEFT" }, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 316.42, "r_x1": 286.37, "r_y1": 316.42, "r_x2": 286.37, "r_y2": 307.52, "r_x3": 50.11, "r_y3": 307.52, "coord_origin": "TOPLEFT" }, "text": "or column spans. Therefore a strict HTML structure looks", "orig": "or column spans. Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 328.38, "r_x1": 286.37, "r_y1": 328.38, "r_x2": 286.37, "r_y2": 319.47, "r_x3": 50.11, "r_y3": 319.47, "coord_origin": "TOPLEFT" }, "text": "always rectangular. However, HTML is a lenient encoding", "orig": "always rectangular. However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 340.33, "r_x1": 286.37, "r_y1": 340.33, "r_x2": 286.37, "r_y2": 331.43, "r_x3": 50.11, "r_y3": 331.43, "coord_origin": "TOPLEFT" }, "text": "format, i.e. tables with rows of different sizes might still", "orig": "format, i.e. tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 352.29, "r_x1": 286.37, "r_y1": 352.29, "r_x2": 286.37, "r_y2": 343.38, "r_x3": 50.11, "r_y3": 343.38, "coord_origin": "TOPLEFT" }, "text": "be regarded as correct due to implicit display rules. These", "orig": "be regarded as correct due to implicit display rules. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 364.24, "r_x1": 286.37, "r_y1": 364.24, "r_x2": 286.37, "r_y2": 355.34, "r_x3": 50.11, "r_y3": 355.34, "coord_origin": "TOPLEFT" }, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 376.2, "r_x1": 286.37, "r_y1": 376.2, "r_x2": 286.37, "r_y2": 367.29, "r_x3": 50.11, "r_y3": 367.29, "coord_origin": "TOPLEFT" }, "text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 388.15, "r_x1": 230.8, "r_y1": 388.15, "r_x2": 230.8, "r_y2": 379.25, "r_x3": 50.11, "r_y3": 379.25, "coord_origin": "TOPLEFT" }, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 400.31, "r_x1": 286.36, "r_y1": 400.31, "r_x2": 286.36, "r_y2": 391.41, "r_x3": 62.07, "r_y3": 391.41, "coord_origin": "TOPLEFT" }, "text": "We have developed a technique that tries to derive a", "orig": "We have developed a technique that tries to derive a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 412.27, "r_x1": 286.37, "r_y1": 412.27, "r_x2": 286.37, "r_y2": 403.36, "r_x3": 50.11, "r_y3": 403.36, "coord_origin": "TOPLEFT" }, "text": "missing bounding box out of its neighbors. As a first step,", "orig": "missing bounding box out of its neighbors. As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 424.22, "r_x1": 286.37, "r_y1": 424.22, "r_x2": 286.37, "r_y2": 415.32, "r_x3": 50.11, "r_y3": 415.32, "coord_origin": "TOPLEFT" }, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 436.18, "r_x1": 286.37, "r_y1": 436.18, "r_x2": 286.37, "r_y2": 427.27, "r_x3": 50.11, "r_y3": 427.27, "coord_origin": "TOPLEFT" }, "text": "grid that covers the table structure. In case of strict HTML", "orig": "grid that covers the table structure. In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 448.13, "r_x1": 286.37, "r_y1": 448.13, "r_x2": 286.37, "r_y2": 439.23, "r_x3": 50.11, "r_y3": 439.23, "coord_origin": "TOPLEFT" }, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 460.09, "r_x1": 286.37, "r_y1": 460.09, "r_x2": 286.37, "r_y2": 451.18, "r_x3": 50.11, "r_y3": 451.18, "coord_origin": "TOPLEFT" }, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 472.04, "r_x1": 286.37, "r_y1": 472.04, "r_x2": 286.37, "r_y2": 463.14, "r_x3": 50.11, "r_y3": 463.14, "coord_origin": "TOPLEFT" }, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 484.0, "r_x1": 286.37, "r_y1": 484.0, "r_x2": 286.37, "r_y2": 475.09, "r_x3": 50.11, "r_y3": 475.09, "coord_origin": "TOPLEFT" }, "text": "for a rectangular table, it is possible to compute the geo-", "orig": "for a rectangular table, it is possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 495.95, "r_x1": 286.37, "r_y1": 495.95, "r_x2": 286.37, "r_y2": 487.05, "r_x3": 50.11, "r_y3": 487.05, "coord_origin": "TOPLEFT" }, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 507.91, "r_x1": 286.37, "r_y1": 507.91, "r_x2": 286.37, "r_y2": 499.0, "r_x3": 50.11, "r_y3": 499.0, "coord_origin": "TOPLEFT" }, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 519.86, "r_x1": 286.37, "r_y1": 519.86, "r_x2": 286.37, "r_y2": 510.96, "r_x3": 50.11, "r_y3": 510.96, "coord_origin": "TOPLEFT" }, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 531.82, "r_x1": 286.37, "r_y1": 531.82, "r_x2": 286.37, "r_y2": 522.91, "r_x3": 50.11, "r_y3": 522.91, "coord_origin": "TOPLEFT" }, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 543.77, "r_x1": 286.37, "r_y1": 543.77, "r_x2": 286.37, "r_y2": 534.87, "r_x3": 50.11, "r_y3": 534.87, "coord_origin": "TOPLEFT" }, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 555.73, "r_x1": 286.37, "r_y1": 555.73, "r_x2": 286.37, "r_y2": 546.82, "r_x3": 50.11, "r_y3": 546.82, "coord_origin": "TOPLEFT" }, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 567.68, "r_x1": 257.47, "r_y1": 567.68, "r_x2": 257.47, "r_y2": 558.78, "r_x3": 50.11, "r_y3": 558.78, "coord_origin": "TOPLEFT" }, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.95, "r_y0": 567.68, "r_x1": 286.37, "r_y1": 567.68, "r_x2": 286.37, "r_y2": 558.78, "r_x3": 263.95, "r_y3": 558.78, "coord_origin": "TOPLEFT" }, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 579.64, "r_x1": 286.37, "r_y1": 579.64, "r_x2": 286.37, "r_y2": 570.73, "r_x3": 50.11, "r_y3": 570.73, "coord_origin": "TOPLEFT" }, "text": "we have decided to simply discard those tables. In case of", "orig": "we have decided to simply discard those tables. In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 591.59, "r_x1": 286.37, "r_y1": 591.59, "r_x2": 286.37, "r_y2": 582.69, "r_x3": 50.11, "r_y3": 582.69, "coord_origin": "TOPLEFT" }, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 603.55, "r_x1": 286.37, "r_y1": 603.55, "r_x2": 286.37, "r_y2": 594.64, "r_x3": 50.11, "r_y3": 594.64, "coord_origin": "TOPLEFT" }, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 615.5, "r_x1": 286.37, "r_y1": 615.5, "r_x2": 286.37, "r_y2": 606.6, "r_x3": 50.11, "r_y3": 606.6, "coord_origin": "TOPLEFT" }, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 627.46, "r_x1": 242.26, "r_y1": 627.46, "r_x2": 242.26, "r_y2": 618.55, "r_x3": 50.11, "r_y3": 618.55, "coord_origin": "TOPLEFT" }, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 639.62, "r_x1": 286.36, "r_y1": 639.62, "r_x2": 286.36, "r_y2": 630.71, "r_x3": 62.07, "r_y3": 630.71, "coord_origin": "TOPLEFT" }, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 651.57, "r_x1": 179.9, "r_y1": 651.57, "r_x2": 179.9, "r_y2": 642.67, "r_x3": 50.11, "r_y3": 642.67, "coord_origin": "TOPLEFT" }, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 672.24, "r_x1": 64.3, "r_y1": 672.24, "r_x2": 64.3, "r_y2": 662.39, "r_x3": 50.11, "r_y3": 662.39, "coord_origin": "TOPLEFT" }, "text": "1.2.", "orig": "1.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.75, "r_y0": 672.24, "r_x1": 153.61, "r_y1": 672.24, "r_x2": 153.61, "r_y2": 662.39, "r_x3": 73.75, "r_y3": 662.39, "coord_origin": "TOPLEFT" }, "text": "Synthetic datasets", "orig": "Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 690.24, "r_x1": 286.36, "r_y1": 690.24, "r_x2": 286.36, "r_y2": 681.33, "r_x3": 62.07, "r_y3": 681.33, "coord_origin": "TOPLEFT" }, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 702.19, "r_x1": 286.37, "r_y1": 702.19, "r_x2": 286.37, "r_y2": 693.29, "r_x3": 50.11, "r_y3": 693.29, "coord_origin": "TOPLEFT" }, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 714.15, "r_x1": 84.14, "r_y1": 714.15, "r_x2": 84.14, "r_y2": 705.24, "r_x3": 50.11, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.24, "r_y0": 714.15, "r_x1": 286.37, "r_y1": 714.15, "r_x2": 286.37, "r_y2": 705.24, "r_x3": 91.24, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 171.56, "r_x1": 545.12, "r_y1": 171.56, "r_x2": 545.12, "r_y2": 162.66, "r_x3": 308.86, "r_y3": 162.66, "coord_origin": "TOPLEFT" }, "text": "ances in regard to their size, structure, style and content.", "orig": "ances in regard to their size, structure, style and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 183.52, "r_x1": 545.12, "r_y1": 183.52, "r_x2": 545.12, "r_y2": 174.61, "r_x3": 308.86, "r_y3": 174.61, "coord_origin": "TOPLEFT" }, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 195.47, "r_x1": 545.12, "r_y1": 195.47, "r_x2": 545.12, "r_y2": 186.57, "r_x3": 308.86, "r_y3": 186.57, "coord_origin": "TOPLEFT" }, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 207.43, "r_x1": 484.07, "r_y1": 207.43, "r_x2": 484.07, "r_y2": 198.52, "r_x3": 308.86, "r_y3": 198.52, "coord_origin": "TOPLEFT" }, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 220.14, "r_x1": 545.12, "r_y1": 220.14, "r_x2": 545.12, "r_y2": 211.24, "r_x3": 320.82, "r_y3": 211.24, "coord_origin": "TOPLEFT" }, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 232.1, "r_x1": 448.09, "r_y1": 232.1, "r_x2": 448.09, "r_y2": 223.19, "r_x3": 308.86, "r_y3": 223.19, "coord_origin": "TOPLEFT" }, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 244.81, "r_x1": 328.29, "r_y1": 244.81, "r_x2": 328.29, "r_y2": 235.91, "r_x3": 320.82, "r_y3": 235.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.38, "r_y0": 244.81, "r_x1": 545.11, "r_y1": 244.81, "r_x2": 545.11, "r_y2": 235.91, "r_x3": 335.38, "r_y3": 235.91, "coord_origin": "TOPLEFT" }, "text": "Prepare styling and content templates: The styling", "orig": "Prepare styling and content templates: The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 256.77, "r_x1": 545.12, "r_y1": 256.77, "r_x2": 545.12, "r_y2": 247.86, "r_x3": 308.86, "r_y3": 247.86, "coord_origin": "TOPLEFT" }, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 268.72, "r_x1": 545.12, "r_y1": 268.72, "r_x2": 545.12, "r_y2": 259.82, "r_x3": 308.86, "r_y3": 259.82, "coord_origin": "TOPLEFT" }, "text": "groups of scope specific appearances (e.g. financial data,", "orig": "groups of scope specific appearances (e.g. financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 280.68, "r_x1": 393.38, "r_y1": 280.68, "r_x2": 393.38, "r_y2": 271.77, "r_x3": 308.86, "r_y3": 271.77, "coord_origin": "TOPLEFT" }, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.12, "r_y0": 280.68, "r_x1": 545.12, "r_y1": 280.68, "r_x2": 545.12, "r_y2": 271.77, "r_x3": 400.12, "r_y3": 271.77, "coord_origin": "TOPLEFT" }, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 292.63, "r_x1": 545.12, "r_y1": 292.63, "r_x2": 545.12, "r_y2": 283.73, "r_x3": 308.86, "r_y3": 283.73, "coord_origin": "TOPLEFT" }, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.59, "r_x1": 545.12, "r_y1": 304.59, "r_x2": 545.12, "r_y2": 295.68, "r_x3": 308.86, "r_y3": 295.68, "coord_origin": "TOPLEFT" }, "text": "frequently used terms out of non-synthetic datasets (e.g.", "orig": "frequently used terms out of non-synthetic datasets (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.54, "r_x1": 425.69, "r_y1": 316.54, "r_x2": 425.69, "r_y2": 307.64, "r_x3": 308.86, "r_y3": 307.64, "coord_origin": "TOPLEFT" }, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 329.26, "r_x1": 328.49, "r_y1": 329.26, "r_x2": 328.49, "r_y2": 320.35, "r_x3": 320.82, "r_y3": 320.35, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.05, "r_y0": 329.26, "r_x1": 545.11, "r_y1": 329.26, "r_x2": 545.11, "r_y2": 320.35, "r_x3": 331.05, "r_y3": 320.35, "coord_origin": "TOPLEFT" }, "text": "Generate table structures: The structure of each syn-", "orig": "Generate table structures: The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 341.21, "r_x1": 545.12, "r_y1": 341.21, "r_x2": 545.12, "r_y2": 332.31, "r_x3": 308.86, "r_y3": 332.31, "coord_origin": "TOPLEFT" }, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 353.17, "r_x1": 545.12, "r_y1": 353.17, "r_x2": 545.12, "r_y2": 344.26, "r_x3": 308.86, "r_y3": 344.26, "coord_origin": "TOPLEFT" }, "text": "tentially spans over multiple rows and a table body that", "orig": "tentially spans over multiple rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 365.12, "r_x1": 545.12, "r_y1": 365.12, "r_x2": 545.12, "r_y2": 356.22, "r_x3": 308.86, "r_y3": 356.22, "coord_origin": "TOPLEFT" }, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 377.08, "r_x1": 545.12, "r_y1": 377.08, "r_x2": 545.12, "r_y2": 368.17, "r_x3": 308.86, "r_y3": 368.17, "coord_origin": "TOPLEFT" }, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 389.03, "r_x1": 545.11, "r_y1": 389.03, "r_x2": 545.11, "r_y2": 380.13, "r_x3": 308.86, "r_y3": 380.13, "coord_origin": "TOPLEFT" }, "text": "boundary. The table structure is described by the parame-", "orig": "boundary. The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.99, "r_x1": 545.12, "r_y1": 400.99, "r_x2": 545.12, "r_y2": 392.08, "r_x3": 308.86, "r_y3": 392.08, "coord_origin": "TOPLEFT" }, "text": "ters: Total number of table rows and columns, number of", "orig": "ters: Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.94, "r_x1": 545.12, "r_y1": 412.94, "r_x2": 545.12, "r_y2": 404.04, "r_x3": 308.86, "r_y3": 404.04, "coord_origin": "TOPLEFT" }, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.9, "r_x1": 545.11, "r_y1": 424.9, "r_x2": 545.11, "r_y2": 415.99, "r_x3": 308.86, "r_y3": 415.99, "coord_origin": "TOPLEFT" }, "text": "spans, column only spans, both row and column spans),", "orig": "spans, column only spans, both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.85, "r_x1": 545.12, "r_y1": 436.85, "r_x2": 545.12, "r_y2": 427.95, "r_x3": 308.86, "r_y3": 427.95, "coord_origin": "TOPLEFT" }, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.81, "r_x1": 345.94, "r_y1": 448.81, "r_x2": 345.94, "r_y2": 439.9, "r_x3": 308.86, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 461.52, "r_x1": 328.3, "r_y1": 461.52, "r_x2": 328.3, "r_y2": 452.62, "r_x3": 320.82, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.8, "r_y0": 461.52, "r_x1": 485.76, "r_y1": 461.52, "r_x2": 485.76, "r_y2": 452.62, "r_x3": 330.8, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": "Generate content: Based on the dataset", "orig": "Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.07, "r_y0": 461.29, "r_x1": 511.86, "r_y1": 461.29, "r_x2": 511.86, "r_y2": 452.71, "r_x3": 488.07, "r_y3": 452.71, "coord_origin": "TOPLEFT" }, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.86, "r_y0": 461.52, "r_x1": 545.11, "r_y1": 461.52, "r_x2": 545.11, "r_y2": 452.62, "r_x3": 511.86, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 473.48, "r_x1": 545.12, "r_y1": 473.48, "r_x2": 545.12, "r_y2": 464.57, "r_x3": 308.86, "r_y3": 464.57, "coord_origin": "TOPLEFT" }, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 485.43, "r_x1": 545.12, "r_y1": 485.43, "r_x2": 545.12, "r_y2": 476.53, "r_x3": 308.86, "r_y3": 476.53, "coord_origin": "TOPLEFT" }, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.39, "r_x1": 379.15, "r_y1": 497.39, "r_x2": 379.15, "r_y2": 488.48, "r_x3": 308.86, "r_y3": 488.48, "coord_origin": "TOPLEFT" }, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 510.1, "r_x1": 328.66, "r_y1": 510.1, "r_x2": 328.66, "r_y2": 501.2, "r_x3": 320.82, "r_y3": 501.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.28, "r_y0": 510.1, "r_x1": 545.11, "r_y1": 510.1, "r_x2": 545.11, "r_y2": 501.2, "r_x3": 331.28, "r_y3": 501.2, "coord_origin": "TOPLEFT" }, "text": "Apply styling templates: Depending on the domain", "orig": "Apply styling templates: Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 522.06, "r_x1": 545.12, "r_y1": 522.06, "r_x2": 545.12, "r_y2": 513.15, "r_x3": 308.86, "r_y3": 513.15, "coord_origin": "TOPLEFT" }, "text": "of the synthetic dataset, a set of styling templates is first", "orig": "of the synthetic dataset, a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 534.01, "r_x1": 384.3, "r_y1": 534.01, "r_x2": 384.3, "r_y2": 525.11, "r_x3": 308.86, "r_y3": 525.11, "coord_origin": "TOPLEFT" }, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.25, "r_y0": 534.01, "r_x1": 545.12, "r_y1": 534.01, "r_x2": 545.12, "r_y2": 525.11, "r_x3": 391.25, "r_y3": 525.11, "coord_origin": "TOPLEFT" }, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.97, "r_x1": 496.16, "r_y1": 545.97, "r_x2": 496.16, "r_y2": 537.06, "r_x3": 308.86, "r_y3": 537.06, "coord_origin": "TOPLEFT" }, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 558.68, "r_x1": 328.29, "r_y1": 558.68, "r_x2": 328.29, "r_y2": 549.78, "r_x3": 320.82, "r_y3": 549.78, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.4, "r_y0": 558.68, "r_x1": 545.11, "r_y1": 558.68, "r_x2": 545.11, "r_y2": 549.78, "r_x3": 335.4, "r_y3": 549.78, "coord_origin": "TOPLEFT" }, "text": "Render the complete tables: The synthetic table is", "orig": "Render the complete tables: The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 570.64, "r_x1": 545.12, "r_y1": 570.64, "r_x2": 545.12, "r_y2": 561.73, "r_x3": 308.86, "r_y3": 561.73, "coord_origin": "TOPLEFT" }, "text": "finally rendered by a web browser engine to generate the", "orig": "finally rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 582.59, "r_x1": 545.12, "r_y1": 582.59, "r_x2": 545.12, "r_y2": 573.69, "r_x3": 308.86, "r_y3": 573.69, "coord_origin": "TOPLEFT" }, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 594.55, "r_x1": 545.12, "r_y1": 594.55, "r_x2": 545.12, "r_y2": 585.64, "r_x3": 308.86, "r_y3": 585.64, "coord_origin": "TOPLEFT" }, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 606.5, "r_x1": 341.23, "r_y1": 606.5, "r_x2": 341.23, "r_y2": 597.6, "r_x3": 308.86, "r_y3": 597.6, "coord_origin": "TOPLEFT" }, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 633.04, "r_x1": 316.77, "r_y1": 633.04, "r_x2": 316.77, "r_y2": 622.29, "r_x3": 308.86, "r_y3": 622.29, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.31, "r_y0": 633.04, "r_x1": 545.11, "r_y1": 633.04, "r_x2": 545.11, "r_y2": 622.29, "r_x3": 327.31, "r_y3": 622.29, "coord_origin": "TOPLEFT" }, "text": "Prediction post-processing for PDF docu-", "orig": "Prediction post-processing for PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 646.99, "r_x1": 357.34, "r_y1": 646.99, "r_x2": 357.34, "r_y2": 636.24, "r_x3": 326.8, "r_y3": 636.24, "coord_origin": "TOPLEFT" }, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 666.33, "r_x1": 545.11, "r_y1": 666.33, "r_x2": 545.11, "r_y2": 657.42, "r_x3": 320.82, "r_y3": 657.42, "coord_origin": "TOPLEFT" }, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 678.28, "r_x1": 545.12, "r_y1": 678.28, "r_x2": 545.12, "r_y2": 669.38, "r_x3": 308.86, "r_y3": 669.38, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 690.24, "r_x1": 545.12, "r_y1": 690.24, "r_x2": 545.12, "r_y2": 681.33, "r_x3": 308.86, "r_y3": 681.33, "coord_origin": "TOPLEFT" }, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 702.19, "r_x1": 545.12, "r_y1": 702.19, "r_x2": 545.12, "r_y2": 693.29, "r_x3": 308.86, "r_y3": 693.29, "coord_origin": "TOPLEFT" }, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 714.15, "r_x1": 371.43, "r_y1": 714.15, "r_x2": 371.43, "r_y2": 705.24, "r_x3": 308.86, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 18, "label": "section_header", "bbox": { "l": 132.84, "t": 110.57, "r": 465.38, "b": 135.53, "coord_origin": "TOPLEFT" }, "confidence": 0.65, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.84, "r_y0": 121.32, "r_x1": 465.38, "r_y1": 121.32, "r_x2": 465.38, "r_y2": 110.57, "r_x3": 132.84, "r_y3": 110.57, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.18, "r_y0": 135.53, "r_x1": 375.04, "r_y1": 135.53, "r_x2": 375.04, "r_y2": 122.26, "r_x3": 220.18, "r_y3": 122.26, "coord_origin": "TOPLEFT" }, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "section_header", "bbox": { "l": 50.11, "t": 161.16, "r": 175.96, "b": 171.91, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 171.91, "r_x1": 57.09, "r_y1": 171.91, "r_x2": 57.09, "r_y2": 161.16, "r_x3": 50.11, "r_y3": 161.16, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.39, "r_y0": 171.91, "r_x1": 175.96, "r_y1": 171.91, "r_x2": 175.96, "r_y2": 161.16, "r_x3": 66.39, "r_y3": 161.16, "coord_origin": "TOPLEFT" }, "text": "Details on the datasets", "orig": "Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "section_header", "bbox": { "l": 50.11, "t": 180.98, "r": 150.36, "b": 190.83, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 190.83, "r_x1": 64.21, "r_y1": 190.83, "r_x2": 64.21, "r_y2": 180.98, "r_x3": 50.11, "r_y3": 180.98, "coord_origin": "TOPLEFT" }, "text": "1.1.", "orig": "1.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.61, "r_y0": 190.83, "r_x1": 150.36, "r_y1": 190.83, "r_x2": 150.36, "r_y2": 180.98, "r_x3": 73.61, "r_y3": 180.98, "coord_origin": "TOPLEFT" }, "text": "Data preparation", "orig": "Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 199.92, "r": 286.37, "b": 388.15, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 208.83, "r_x1": 286.36, "r_y1": 208.83, "r_x2": 286.36, "r_y2": 199.92, "r_x3": 62.07, "r_y3": 199.92, "coord_origin": "TOPLEFT" }, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 220.78, "r_x1": 286.37, "r_y1": 220.78, "r_x2": 286.37, "r_y2": 211.88, "r_x3": 50.11, "r_y3": 211.88, "coord_origin": "TOPLEFT" }, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 232.74, "r_x1": 286.37, "r_y1": 232.74, "r_x2": 286.37, "r_y2": 223.83, "r_x3": 50.11, "r_y3": 223.83, "coord_origin": "TOPLEFT" }, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 244.69, "r_x1": 286.37, "r_y1": 244.69, "r_x2": 286.37, "r_y2": 235.79, "r_x3": 50.11, "r_y3": 235.79, "coord_origin": "TOPLEFT" }, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 256.65, "r_x1": 286.37, "r_y1": 256.65, "r_x2": 286.37, "r_y2": 247.74, "r_x3": 50.11, "r_y3": 247.74, "coord_origin": "TOPLEFT" }, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 268.6, "r_x1": 286.37, "r_y1": 268.6, "r_x2": 286.37, "r_y2": 259.7, "r_x3": 50.11, "r_y3": 259.7, "coord_origin": "TOPLEFT" }, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 280.56, "r_x1": 286.37, "r_y1": 280.56, "r_x2": 286.37, "r_y2": 271.65, "r_x3": 50.11, "r_y3": 271.65, "coord_origin": "TOPLEFT" }, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 292.51, "r_x1": 286.37, "r_y1": 292.51, "r_x2": 286.37, "r_y2": 283.61, "r_x3": 50.11, "r_y3": 283.61, "coord_origin": "TOPLEFT" }, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 304.47, "r_x1": 286.37, "r_y1": 304.47, "r_x2": 286.37, "r_y2": 295.56, "r_x3": 50.11, "r_y3": 295.56, "coord_origin": "TOPLEFT" }, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 316.42, "r_x1": 286.37, "r_y1": 316.42, "r_x2": 286.37, "r_y2": 307.52, "r_x3": 50.11, "r_y3": 307.52, "coord_origin": "TOPLEFT" }, "text": "or column spans. Therefore a strict HTML structure looks", "orig": "or column spans. Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 328.38, "r_x1": 286.37, "r_y1": 328.38, "r_x2": 286.37, "r_y2": 319.47, "r_x3": 50.11, "r_y3": 319.47, "coord_origin": "TOPLEFT" }, "text": "always rectangular. However, HTML is a lenient encoding", "orig": "always rectangular. However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 340.33, "r_x1": 286.37, "r_y1": 340.33, "r_x2": 286.37, "r_y2": 331.43, "r_x3": 50.11, "r_y3": 331.43, "coord_origin": "TOPLEFT" }, "text": "format, i.e. tables with rows of different sizes might still", "orig": "format, i.e. tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 352.29, "r_x1": 286.37, "r_y1": 352.29, "r_x2": 286.37, "r_y2": 343.38, "r_x3": 50.11, "r_y3": 343.38, "coord_origin": "TOPLEFT" }, "text": "be regarded as correct due to implicit display rules. These", "orig": "be regarded as correct due to implicit display rules. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 364.24, "r_x1": 286.37, "r_y1": 364.24, "r_x2": 286.37, "r_y2": 355.34, "r_x3": 50.11, "r_y3": 355.34, "coord_origin": "TOPLEFT" }, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 376.2, "r_x1": 286.37, "r_y1": 376.2, "r_x2": 286.37, "r_y2": 367.29, "r_x3": 50.11, "r_y3": 367.29, "coord_origin": "TOPLEFT" }, "text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 388.15, "r_x1": 230.8, "r_y1": 388.15, "r_x2": 230.8, "r_y2": 379.25, "r_x3": 50.11, "r_y3": 379.25, "coord_origin": "TOPLEFT" }, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 391.41, "r": 286.37, "b": 627.46, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 400.31, "r_x1": 286.36, "r_y1": 400.31, "r_x2": 286.36, "r_y2": 391.41, "r_x3": 62.07, "r_y3": 391.41, "coord_origin": "TOPLEFT" }, "text": "We have developed a technique that tries to derive a", "orig": "We have developed a technique that tries to derive a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 412.27, "r_x1": 286.37, "r_y1": 412.27, "r_x2": 286.37, "r_y2": 403.36, "r_x3": 50.11, "r_y3": 403.36, "coord_origin": "TOPLEFT" }, "text": "missing bounding box out of its neighbors. As a first step,", "orig": "missing bounding box out of its neighbors. As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 424.22, "r_x1": 286.37, "r_y1": 424.22, "r_x2": 286.37, "r_y2": 415.32, "r_x3": 50.11, "r_y3": 415.32, "coord_origin": "TOPLEFT" }, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 436.18, "r_x1": 286.37, "r_y1": 436.18, "r_x2": 286.37, "r_y2": 427.27, "r_x3": 50.11, "r_y3": 427.27, "coord_origin": "TOPLEFT" }, "text": "grid that covers the table structure. In case of strict HTML", "orig": "grid that covers the table structure. In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 448.13, "r_x1": 286.37, "r_y1": 448.13, "r_x2": 286.37, "r_y2": 439.23, "r_x3": 50.11, "r_y3": 439.23, "coord_origin": "TOPLEFT" }, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 460.09, "r_x1": 286.37, "r_y1": 460.09, "r_x2": 286.37, "r_y2": 451.18, "r_x3": 50.11, "r_y3": 451.18, "coord_origin": "TOPLEFT" }, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 472.04, "r_x1": 286.37, "r_y1": 472.04, "r_x2": 286.37, "r_y2": 463.14, "r_x3": 50.11, "r_y3": 463.14, "coord_origin": "TOPLEFT" }, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 484.0, "r_x1": 286.37, "r_y1": 484.0, "r_x2": 286.37, "r_y2": 475.09, "r_x3": 50.11, "r_y3": 475.09, "coord_origin": "TOPLEFT" }, "text": "for a rectangular table, it is possible to compute the geo-", "orig": "for a rectangular table, it is possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 495.95, "r_x1": 286.37, "r_y1": 495.95, "r_x2": 286.37, "r_y2": 487.05, "r_x3": 50.11, "r_y3": 487.05, "coord_origin": "TOPLEFT" }, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 507.91, "r_x1": 286.37, "r_y1": 507.91, "r_x2": 286.37, "r_y2": 499.0, "r_x3": 50.11, "r_y3": 499.0, "coord_origin": "TOPLEFT" }, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 519.86, "r_x1": 286.37, "r_y1": 519.86, "r_x2": 286.37, "r_y2": 510.96, "r_x3": 50.11, "r_y3": 510.96, "coord_origin": "TOPLEFT" }, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 531.82, "r_x1": 286.37, "r_y1": 531.82, "r_x2": 286.37, "r_y2": 522.91, "r_x3": 50.11, "r_y3": 522.91, "coord_origin": "TOPLEFT" }, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 543.77, "r_x1": 286.37, "r_y1": 543.77, "r_x2": 286.37, "r_y2": 534.87, "r_x3": 50.11, "r_y3": 534.87, "coord_origin": "TOPLEFT" }, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 555.73, "r_x1": 286.37, "r_y1": 555.73, "r_x2": 286.37, "r_y2": 546.82, "r_x3": 50.11, "r_y3": 546.82, "coord_origin": "TOPLEFT" }, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 567.68, "r_x1": 257.47, "r_y1": 567.68, "r_x2": 257.47, "r_y2": 558.78, "r_x3": 50.11, "r_y3": 558.78, "coord_origin": "TOPLEFT" }, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.95, "r_y0": 567.68, "r_x1": 286.37, "r_y1": 567.68, "r_x2": 286.37, "r_y2": 558.78, "r_x3": 263.95, "r_y3": 558.78, "coord_origin": "TOPLEFT" }, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 579.64, "r_x1": 286.37, "r_y1": 579.64, "r_x2": 286.37, "r_y2": 570.73, "r_x3": 50.11, "r_y3": 570.73, "coord_origin": "TOPLEFT" }, "text": "we have decided to simply discard those tables. In case of", "orig": "we have decided to simply discard those tables. In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 591.59, "r_x1": 286.37, "r_y1": 591.59, "r_x2": 286.37, "r_y2": 582.69, "r_x3": 50.11, "r_y3": 582.69, "coord_origin": "TOPLEFT" }, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 603.55, "r_x1": 286.37, "r_y1": 603.55, "r_x2": 286.37, "r_y2": 594.64, "r_x3": 50.11, "r_y3": 594.64, "coord_origin": "TOPLEFT" }, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 615.5, "r_x1": 286.37, "r_y1": 615.5, "r_x2": 286.37, "r_y2": 606.6, "r_x3": 50.11, "r_y3": 606.6, "coord_origin": "TOPLEFT" }, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 627.46, "r_x1": 242.26, "r_y1": 627.46, "r_x2": 242.26, "r_y2": 618.55, "r_x3": 50.11, "r_y3": 618.55, "coord_origin": "TOPLEFT" }, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 50.11, "t": 630.71, "r": 286.36, "b": 651.57, "coord_origin": "TOPLEFT" }, "confidence": 0.934, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 639.62, "r_x1": 286.36, "r_y1": 639.62, "r_x2": 286.36, "r_y2": 630.71, "r_x3": 62.07, "r_y3": 630.71, "coord_origin": "TOPLEFT" }, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 651.57, "r_x1": 179.9, "r_y1": 651.57, "r_x2": 179.9, "r_y2": 642.67, "r_x3": 50.11, "r_y3": 642.67, "coord_origin": "TOPLEFT" }, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "section_header", "bbox": { "l": 50.11, "t": 662.39, "r": 153.61, "b": 672.24, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 672.24, "r_x1": 64.3, "r_y1": 672.24, "r_x2": 64.3, "r_y2": 662.39, "r_x3": 50.11, "r_y3": 662.39, "coord_origin": "TOPLEFT" }, "text": "1.2.", "orig": "1.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.75, "r_y0": 672.24, "r_x1": 153.61, "r_y1": 672.24, "r_x2": 153.61, "r_y2": 662.39, "r_x3": 73.75, "r_y3": 662.39, "coord_origin": "TOPLEFT" }, "text": "Synthetic datasets", "orig": "Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 681.33, "r": 286.37, "b": 714.15, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 690.24, "r_x1": 286.36, "r_y1": 690.24, "r_x2": 286.36, "r_y2": 681.33, "r_x3": 62.07, "r_y3": 681.33, "coord_origin": "TOPLEFT" }, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 702.19, "r_x1": 286.37, "r_y1": 702.19, "r_x2": 286.37, "r_y2": 693.29, "r_x3": 50.11, "r_y3": 693.29, "coord_origin": "TOPLEFT" }, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 714.15, "r_x1": 84.14, "r_y1": 714.15, "r_x2": 84.14, "r_y2": 705.24, "r_x3": 50.11, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.24, "r_y0": 714.15, "r_x1": 286.37, "r_y1": 714.15, "r_x2": 286.37, "r_y2": 705.24, "r_x3": 91.24, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 308.86, "t": 162.66, "r": 545.12, "b": 207.43, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 171.56, "r_x1": 545.12, "r_y1": 171.56, "r_x2": 545.12, "r_y2": 162.66, "r_x3": 308.86, "r_y3": 162.66, "coord_origin": "TOPLEFT" }, "text": "ances in regard to their size, structure, style and content.", "orig": "ances in regard to their size, structure, style and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 183.52, "r_x1": 545.12, "r_y1": 183.52, "r_x2": 545.12, "r_y2": 174.61, "r_x3": 308.86, "r_y3": 174.61, "coord_origin": "TOPLEFT" }, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 195.47, "r_x1": 545.12, "r_y1": 195.47, "r_x2": 545.12, "r_y2": 186.57, "r_x3": 308.86, "r_y3": 186.57, "coord_origin": "TOPLEFT" }, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 207.43, "r_x1": 484.07, "r_y1": 207.43, "r_x2": 484.07, "r_y2": 198.52, "r_x3": 308.86, "r_y3": 198.52, "coord_origin": "TOPLEFT" }, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 308.86, "t": 211.24, "r": 545.12, "b": 232.1, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 220.14, "r_x1": 545.12, "r_y1": 220.14, "r_x2": 545.12, "r_y2": 211.24, "r_x3": 320.82, "r_y3": 211.24, "coord_origin": "TOPLEFT" }, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 232.1, "r_x1": 448.09, "r_y1": 232.1, "r_x2": 448.09, "r_y2": 223.19, "r_x3": 308.86, "r_y3": 223.19, "coord_origin": "TOPLEFT" }, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 308.86, "t": 235.91, "r": 545.12, "b": 316.54, "coord_origin": "TOPLEFT" }, "confidence": 0.964, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 244.81, "r_x1": 328.29, "r_y1": 244.81, "r_x2": 328.29, "r_y2": 235.91, "r_x3": 320.82, "r_y3": 235.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.38, "r_y0": 244.81, "r_x1": 545.11, "r_y1": 244.81, "r_x2": 545.11, "r_y2": 235.91, "r_x3": 335.38, "r_y3": 235.91, "coord_origin": "TOPLEFT" }, "text": "Prepare styling and content templates: The styling", "orig": "Prepare styling and content templates: The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 256.77, "r_x1": 545.12, "r_y1": 256.77, "r_x2": 545.12, "r_y2": 247.86, "r_x3": 308.86, "r_y3": 247.86, "coord_origin": "TOPLEFT" }, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 268.72, "r_x1": 545.12, "r_y1": 268.72, "r_x2": 545.12, "r_y2": 259.82, "r_x3": 308.86, "r_y3": 259.82, "coord_origin": "TOPLEFT" }, "text": "groups of scope specific appearances (e.g. financial data,", "orig": "groups of scope specific appearances (e.g. financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 280.68, "r_x1": 393.38, "r_y1": 280.68, "r_x2": 393.38, "r_y2": 271.77, "r_x3": 308.86, "r_y3": 271.77, "coord_origin": "TOPLEFT" }, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.12, "r_y0": 280.68, "r_x1": 545.12, "r_y1": 280.68, "r_x2": 545.12, "r_y2": 271.77, "r_x3": 400.12, "r_y3": 271.77, "coord_origin": "TOPLEFT" }, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 292.63, "r_x1": 545.12, "r_y1": 292.63, "r_x2": 545.12, "r_y2": 283.73, "r_x3": 308.86, "r_y3": 283.73, "coord_origin": "TOPLEFT" }, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.59, "r_x1": 545.12, "r_y1": 304.59, "r_x2": 545.12, "r_y2": 295.68, "r_x3": 308.86, "r_y3": 295.68, "coord_origin": "TOPLEFT" }, "text": "frequently used terms out of non-synthetic datasets (e.g.", "orig": "frequently used terms out of non-synthetic datasets (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.54, "r_x1": 425.69, "r_y1": 316.54, "r_x2": 425.69, "r_y2": 307.64, "r_x3": 308.86, "r_y3": 307.64, "coord_origin": "TOPLEFT" }, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 320.35, "r": 545.12, "b": 448.81, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 329.26, "r_x1": 328.49, "r_y1": 329.26, "r_x2": 328.49, "r_y2": 320.35, "r_x3": 320.82, "r_y3": 320.35, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.05, "r_y0": 329.26, "r_x1": 545.11, "r_y1": 329.26, "r_x2": 545.11, "r_y2": 320.35, "r_x3": 331.05, "r_y3": 320.35, "coord_origin": "TOPLEFT" }, "text": "Generate table structures: The structure of each syn-", "orig": "Generate table structures: The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 341.21, "r_x1": 545.12, "r_y1": 341.21, "r_x2": 545.12, "r_y2": 332.31, "r_x3": 308.86, "r_y3": 332.31, "coord_origin": "TOPLEFT" }, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 353.17, "r_x1": 545.12, "r_y1": 353.17, "r_x2": 545.12, "r_y2": 344.26, "r_x3": 308.86, "r_y3": 344.26, "coord_origin": "TOPLEFT" }, "text": "tentially spans over multiple rows and a table body that", "orig": "tentially spans over multiple rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 365.12, "r_x1": 545.12, "r_y1": 365.12, "r_x2": 545.12, "r_y2": 356.22, "r_x3": 308.86, "r_y3": 356.22, "coord_origin": "TOPLEFT" }, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 377.08, "r_x1": 545.12, "r_y1": 377.08, "r_x2": 545.12, "r_y2": 368.17, "r_x3": 308.86, "r_y3": 368.17, "coord_origin": "TOPLEFT" }, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 389.03, "r_x1": 545.11, "r_y1": 389.03, "r_x2": 545.11, "r_y2": 380.13, "r_x3": 308.86, "r_y3": 380.13, "coord_origin": "TOPLEFT" }, "text": "boundary. The table structure is described by the parame-", "orig": "boundary. The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.99, "r_x1": 545.12, "r_y1": 400.99, "r_x2": 545.12, "r_y2": 392.08, "r_x3": 308.86, "r_y3": 392.08, "coord_origin": "TOPLEFT" }, "text": "ters: Total number of table rows and columns, number of", "orig": "ters: Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.94, "r_x1": 545.12, "r_y1": 412.94, "r_x2": 545.12, "r_y2": 404.04, "r_x3": 308.86, "r_y3": 404.04, "coord_origin": "TOPLEFT" }, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.9, "r_x1": 545.11, "r_y1": 424.9, "r_x2": 545.11, "r_y2": 415.99, "r_x3": 308.86, "r_y3": 415.99, "coord_origin": "TOPLEFT" }, "text": "spans, column only spans, both row and column spans),", "orig": "spans, column only spans, both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.85, "r_x1": 545.12, "r_y1": 436.85, "r_x2": 545.12, "r_y2": 427.95, "r_x3": 308.86, "r_y3": 427.95, "coord_origin": "TOPLEFT" }, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.81, "r_x1": 345.94, "r_y1": 448.81, "r_x2": 345.94, "r_y2": 439.9, "r_x3": 308.86, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 452.62, "r": 545.12, "b": 497.39, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 461.52, "r_x1": 328.3, "r_y1": 461.52, "r_x2": 328.3, "r_y2": 452.62, "r_x3": 320.82, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.8, "r_y0": 461.52, "r_x1": 485.76, "r_y1": 461.52, "r_x2": 485.76, "r_y2": 452.62, "r_x3": 330.8, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": "Generate content: Based on the dataset", "orig": "Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.07, "r_y0": 461.29, "r_x1": 511.86, "r_y1": 461.29, "r_x2": 511.86, "r_y2": 452.71, "r_x3": 488.07, "r_y3": 452.71, "coord_origin": "TOPLEFT" }, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.86, "r_y0": 461.52, "r_x1": 545.11, "r_y1": 461.52, "r_x2": 545.11, "r_y2": 452.62, "r_x3": 511.86, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 473.48, "r_x1": 545.12, "r_y1": 473.48, "r_x2": 545.12, "r_y2": 464.57, "r_x3": 308.86, "r_y3": 464.57, "coord_origin": "TOPLEFT" }, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 485.43, "r_x1": 545.12, "r_y1": 485.43, "r_x2": 545.12, "r_y2": 476.53, "r_x3": 308.86, "r_y3": 476.53, "coord_origin": "TOPLEFT" }, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.39, "r_x1": 379.15, "r_y1": 497.39, "r_x2": 379.15, "r_y2": 488.48, "r_x3": 308.86, "r_y3": 488.48, "coord_origin": "TOPLEFT" }, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 308.86, "t": 501.2, "r": 545.12, "b": 545.97, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 510.1, "r_x1": 328.66, "r_y1": 510.1, "r_x2": 328.66, "r_y2": 501.2, "r_x3": 320.82, "r_y3": 501.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.28, "r_y0": 510.1, "r_x1": 545.11, "r_y1": 510.1, "r_x2": 545.11, "r_y2": 501.2, "r_x3": 331.28, "r_y3": 501.2, "coord_origin": "TOPLEFT" }, "text": "Apply styling templates: Depending on the domain", "orig": "Apply styling templates: Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 522.06, "r_x1": 545.12, "r_y1": 522.06, "r_x2": 545.12, "r_y2": 513.15, "r_x3": 308.86, "r_y3": 513.15, "coord_origin": "TOPLEFT" }, "text": "of the synthetic dataset, a set of styling templates is first", "orig": "of the synthetic dataset, a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 534.01, "r_x1": 384.3, "r_y1": 534.01, "r_x2": 384.3, "r_y2": 525.11, "r_x3": 308.86, "r_y3": 525.11, "coord_origin": "TOPLEFT" }, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.25, "r_y0": 534.01, "r_x1": 545.12, "r_y1": 534.01, "r_x2": 545.12, "r_y2": 525.11, "r_x3": 391.25, "r_y3": 525.11, "coord_origin": "TOPLEFT" }, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.97, "r_x1": 496.16, "r_y1": 545.97, "r_x2": 496.16, "r_y2": 537.06, "r_x3": 308.86, "r_y3": 537.06, "coord_origin": "TOPLEFT" }, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 308.86, "t": 549.78, "r": 545.12, "b": 606.5, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 558.68, "r_x1": 328.29, "r_y1": 558.68, "r_x2": 328.29, "r_y2": 549.78, "r_x3": 320.82, "r_y3": 549.78, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.4, "r_y0": 558.68, "r_x1": 545.11, "r_y1": 558.68, "r_x2": 545.11, "r_y2": 549.78, "r_x3": 335.4, "r_y3": 549.78, "coord_origin": "TOPLEFT" }, "text": "Render the complete tables: The synthetic table is", "orig": "Render the complete tables: The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 570.64, "r_x1": 545.12, "r_y1": 570.64, "r_x2": 545.12, "r_y2": 561.73, "r_x3": 308.86, "r_y3": 561.73, "coord_origin": "TOPLEFT" }, "text": "finally rendered by a web browser engine to generate the", "orig": "finally rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 582.59, "r_x1": 545.12, "r_y1": 582.59, "r_x2": 545.12, "r_y2": 573.69, "r_x3": 308.86, "r_y3": 573.69, "coord_origin": "TOPLEFT" }, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 594.55, "r_x1": 545.12, "r_y1": 594.55, "r_x2": 545.12, "r_y2": 585.64, "r_x3": 308.86, "r_y3": 585.64, "coord_origin": "TOPLEFT" }, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 606.5, "r_x1": 341.23, "r_y1": 606.5, "r_x2": 341.23, "r_y2": 597.6, "r_x3": 308.86, "r_y3": 597.6, "coord_origin": "TOPLEFT" }, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "section_header", "bbox": { "l": 308.86, "t": 622.29, "r": 545.11, "b": 646.99, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 633.04, "r_x1": 316.77, "r_y1": 633.04, "r_x2": 316.77, "r_y2": 622.29, "r_x3": 308.86, "r_y3": 622.29, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.31, "r_y0": 633.04, "r_x1": 545.11, "r_y1": 633.04, "r_x2": 545.11, "r_y2": 622.29, "r_x3": 327.31, "r_y3": 622.29, "coord_origin": "TOPLEFT" }, "text": "Prediction post-processing for PDF docu-", "orig": "Prediction post-processing for PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 646.99, "r_x1": 357.34, "r_y1": 646.99, "r_x2": 357.34, "r_y2": 636.24, "r_x3": 326.8, "r_y3": 636.24, "coord_origin": "TOPLEFT" }, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 657.42, "r": 545.12, "b": 714.15, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 666.33, "r_x1": 545.11, "r_y1": 666.33, "r_x2": 545.11, "r_y2": 657.42, "r_x3": 320.82, "r_y3": 657.42, "coord_origin": "TOPLEFT" }, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 678.28, "r_x1": 545.12, "r_y1": 678.28, "r_x2": 545.12, "r_y2": 669.38, "r_x3": 308.86, "r_y3": 669.38, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 690.24, "r_x1": 545.12, "r_y1": 690.24, "r_x2": 545.12, "r_y2": 681.33, "r_x3": 308.86, "r_y3": 681.33, "coord_origin": "TOPLEFT" }, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 702.19, "r_x1": 545.12, "r_y1": 702.19, "r_x2": 545.12, "r_y2": 693.29, "r_x3": 308.86, "r_y3": 693.29, "coord_origin": "TOPLEFT" }, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 714.15, "r_x1": 371.43, "r_y1": 714.15, "r_x2": 371.43, "r_y2": 705.24, "r_x3": 308.86, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.899, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 18, "page_no": 10, "cluster": { "id": 18, "label": "section_header", "bbox": { "l": 132.84, "t": 110.57, "r": 465.38, "b": 135.53, "coord_origin": "TOPLEFT" }, "confidence": 0.65, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.84, "r_y0": 121.32, "r_x1": 465.38, "r_y1": 121.32, "r_x2": 465.38, "r_y2": 110.57, "r_x3": 132.84, "r_y3": 110.57, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.18, "r_y0": 135.53, "r_x1": 375.04, "r_y1": 135.53, "r_x2": 375.04, "r_y2": 122.26, "r_x3": 220.18, "r_y3": 122.26, "coord_origin": "TOPLEFT" }, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material" }, { "label": "section_header", "id": 13, "page_no": 10, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 50.11, "t": 161.16, "r": 175.96, "b": 171.91, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 171.91, "r_x1": 57.09, "r_y1": 171.91, "r_x2": 57.09, "r_y2": 161.16, "r_x3": 50.11, "r_y3": 161.16, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.39, "r_y0": 171.91, "r_x1": 175.96, "r_y1": 171.91, "r_x2": 175.96, "r_y2": 161.16, "r_x3": 66.39, "r_y3": 161.16, "coord_origin": "TOPLEFT" }, "text": "Details on the datasets", "orig": "Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Details on the datasets" }, { "label": "section_header", "id": 11, "page_no": 10, "cluster": { "id": 11, "label": "section_header", "bbox": { "l": 50.11, "t": 180.98, "r": 150.36, "b": 190.83, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 190.83, "r_x1": 64.21, "r_y1": 190.83, "r_x2": 64.21, "r_y2": 180.98, "r_x3": 50.11, "r_y3": 180.98, "coord_origin": "TOPLEFT" }, "text": "1.1.", "orig": "1.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.61, "r_y0": 190.83, "r_x1": 150.36, "r_y1": 190.83, "r_x2": 150.36, "r_y2": 180.98, "r_x3": 73.61, "r_y3": 180.98, "coord_origin": "TOPLEFT" }, "text": "Data preparation", "orig": "Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1.1. Data preparation" }, { "label": "text", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 199.92, "r": 286.37, "b": 388.15, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 208.83, "r_x1": 286.36, "r_y1": 208.83, "r_x2": 286.36, "r_y2": 199.92, "r_x3": 62.07, "r_y3": 199.92, "coord_origin": "TOPLEFT" }, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 220.78, "r_x1": 286.37, "r_y1": 220.78, "r_x2": 286.37, "r_y2": 211.88, "r_x3": 50.11, "r_y3": 211.88, "coord_origin": "TOPLEFT" }, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 232.74, "r_x1": 286.37, "r_y1": 232.74, "r_x2": 286.37, "r_y2": 223.83, "r_x3": 50.11, "r_y3": 223.83, "coord_origin": "TOPLEFT" }, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 244.69, "r_x1": 286.37, "r_y1": 244.69, "r_x2": 286.37, "r_y2": 235.79, "r_x3": 50.11, "r_y3": 235.79, "coord_origin": "TOPLEFT" }, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 256.65, "r_x1": 286.37, "r_y1": 256.65, "r_x2": 286.37, "r_y2": 247.74, "r_x3": 50.11, "r_y3": 247.74, "coord_origin": "TOPLEFT" }, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 268.6, "r_x1": 286.37, "r_y1": 268.6, "r_x2": 286.37, "r_y2": 259.7, "r_x3": 50.11, "r_y3": 259.7, "coord_origin": "TOPLEFT" }, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 280.56, "r_x1": 286.37, "r_y1": 280.56, "r_x2": 286.37, "r_y2": 271.65, "r_x3": 50.11, "r_y3": 271.65, "coord_origin": "TOPLEFT" }, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 292.51, "r_x1": 286.37, "r_y1": 292.51, "r_x2": 286.37, "r_y2": 283.61, "r_x3": 50.11, "r_y3": 283.61, "coord_origin": "TOPLEFT" }, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 304.47, "r_x1": 286.37, "r_y1": 304.47, "r_x2": 286.37, "r_y2": 295.56, "r_x3": 50.11, "r_y3": 295.56, "coord_origin": "TOPLEFT" }, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 316.42, "r_x1": 286.37, "r_y1": 316.42, "r_x2": 286.37, "r_y2": 307.52, "r_x3": 50.11, "r_y3": 307.52, "coord_origin": "TOPLEFT" }, "text": "or column spans. Therefore a strict HTML structure looks", "orig": "or column spans. Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 328.38, "r_x1": 286.37, "r_y1": 328.38, "r_x2": 286.37, "r_y2": 319.47, "r_x3": 50.11, "r_y3": 319.47, "coord_origin": "TOPLEFT" }, "text": "always rectangular. However, HTML is a lenient encoding", "orig": "always rectangular. However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 340.33, "r_x1": 286.37, "r_y1": 340.33, "r_x2": 286.37, "r_y2": 331.43, "r_x3": 50.11, "r_y3": 331.43, "coord_origin": "TOPLEFT" }, "text": "format, i.e. tables with rows of different sizes might still", "orig": "format, i.e. tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 352.29, "r_x1": 286.37, "r_y1": 352.29, "r_x2": 286.37, "r_y2": 343.38, "r_x3": 50.11, "r_y3": 343.38, "coord_origin": "TOPLEFT" }, "text": "be regarded as correct due to implicit display rules. These", "orig": "be regarded as correct due to implicit display rules. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 364.24, "r_x1": 286.37, "r_y1": 364.24, "r_x2": 286.37, "r_y2": 355.34, "r_x3": 50.11, "r_y3": 355.34, "coord_origin": "TOPLEFT" }, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 376.2, "r_x1": 286.37, "r_y1": 376.2, "r_x2": 286.37, "r_y2": 367.29, "r_x3": 50.11, "r_y3": 367.29, "coord_origin": "TOPLEFT" }, "text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 388.15, "r_x1": 230.8, "r_y1": 388.15, "r_x2": 230.8, "r_y2": 379.25, "r_x3": 50.11, "r_y3": 379.25, "coord_origin": "TOPLEFT" }, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). A table is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTML structure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have \"strict\" tables, i.e. tables where every row has exactly the same length." }, { "label": "text", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 391.41, "r": 286.37, "b": 627.46, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 400.31, "r_x1": 286.36, "r_y1": 400.31, "r_x2": 286.36, "r_y2": 391.41, "r_x3": 62.07, "r_y3": 391.41, "coord_origin": "TOPLEFT" }, "text": "We have developed a technique that tries to derive a", "orig": "We have developed a technique that tries to derive a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 412.27, "r_x1": 286.37, "r_y1": 412.27, "r_x2": 286.37, "r_y2": 403.36, "r_x3": 50.11, "r_y3": 403.36, "coord_origin": "TOPLEFT" }, "text": "missing bounding box out of its neighbors. As a first step,", "orig": "missing bounding box out of its neighbors. As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 424.22, "r_x1": 286.37, "r_y1": 424.22, "r_x2": 286.37, "r_y2": 415.32, "r_x3": 50.11, "r_y3": 415.32, "coord_origin": "TOPLEFT" }, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 436.18, "r_x1": 286.37, "r_y1": 436.18, "r_x2": 286.37, "r_y2": 427.27, "r_x3": 50.11, "r_y3": 427.27, "coord_origin": "TOPLEFT" }, "text": "grid that covers the table structure. In case of strict HTML", "orig": "grid that covers the table structure. In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 448.13, "r_x1": 286.37, "r_y1": 448.13, "r_x2": 286.37, "r_y2": 439.23, "r_x3": 50.11, "r_y3": 439.23, "coord_origin": "TOPLEFT" }, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 460.09, "r_x1": 286.37, "r_y1": 460.09, "r_x2": 286.37, "r_y2": 451.18, "r_x3": 50.11, "r_y3": 451.18, "coord_origin": "TOPLEFT" }, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 472.04, "r_x1": 286.37, "r_y1": 472.04, "r_x2": 286.37, "r_y2": 463.14, "r_x3": 50.11, "r_y3": 463.14, "coord_origin": "TOPLEFT" }, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 484.0, "r_x1": 286.37, "r_y1": 484.0, "r_x2": 286.37, "r_y2": 475.09, "r_x3": 50.11, "r_y3": 475.09, "coord_origin": "TOPLEFT" }, "text": "for a rectangular table, it is possible to compute the geo-", "orig": "for a rectangular table, it is possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 495.95, "r_x1": 286.37, "r_y1": 495.95, "r_x2": 286.37, "r_y2": 487.05, "r_x3": 50.11, "r_y3": 487.05, "coord_origin": "TOPLEFT" }, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 507.91, "r_x1": 286.37, "r_y1": 507.91, "r_x2": 286.37, "r_y2": 499.0, "r_x3": 50.11, "r_y3": 499.0, "coord_origin": "TOPLEFT" }, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 519.86, "r_x1": 286.37, "r_y1": 519.86, "r_x2": 286.37, "r_y2": 510.96, "r_x3": 50.11, "r_y3": 510.96, "coord_origin": "TOPLEFT" }, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 531.82, "r_x1": 286.37, "r_y1": 531.82, "r_x2": 286.37, "r_y2": 522.91, "r_x3": 50.11, "r_y3": 522.91, "coord_origin": "TOPLEFT" }, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 543.77, "r_x1": 286.37, "r_y1": 543.77, "r_x2": 286.37, "r_y2": 534.87, "r_x3": 50.11, "r_y3": 534.87, "coord_origin": "TOPLEFT" }, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 555.73, "r_x1": 286.37, "r_y1": 555.73, "r_x2": 286.37, "r_y2": 546.82, "r_x3": 50.11, "r_y3": 546.82, "coord_origin": "TOPLEFT" }, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 567.68, "r_x1": 257.47, "r_y1": 567.68, "r_x2": 257.47, "r_y2": 558.78, "r_x3": 50.11, "r_y3": 558.78, "coord_origin": "TOPLEFT" }, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.95, "r_y0": 567.68, "r_x1": 286.37, "r_y1": 567.68, "r_x2": 286.37, "r_y2": 558.78, "r_x3": 263.95, "r_y3": 558.78, "coord_origin": "TOPLEFT" }, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 579.64, "r_x1": 286.37, "r_y1": 579.64, "r_x2": 286.37, "r_y2": 570.73, "r_x3": 50.11, "r_y3": 570.73, "coord_origin": "TOPLEFT" }, "text": "we have decided to simply discard those tables. In case of", "orig": "we have decided to simply discard those tables. In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 591.59, "r_x1": 286.37, "r_y1": 591.59, "r_x2": 286.37, "r_y2": 582.69, "r_x3": 50.11, "r_y3": 582.69, "coord_origin": "TOPLEFT" }, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 603.55, "r_x1": 286.37, "r_y1": 603.55, "r_x2": 286.37, "r_y2": 594.64, "r_x3": 50.11, "r_y3": 594.64, "coord_origin": "TOPLEFT" }, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 615.5, "r_x1": 286.37, "r_y1": 615.5, "r_x2": 286.37, "r_y2": 606.6, "r_x3": 50.11, "r_y3": 606.6, "coord_origin": "TOPLEFT" }, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 627.46, "r_x1": 242.26, "r_y1": 627.46, "r_x2": 242.26, "r_y2": 618.55, "r_x3": 50.11, "r_y3": 618.55, "coord_origin": "TOPLEFT" }, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes." }, { "label": "text", "id": 14, "page_no": 10, "cluster": { "id": 14, "label": "text", "bbox": { "l": 50.11, "t": 630.71, "r": 286.36, "b": 651.57, "coord_origin": "TOPLEFT" }, "confidence": 0.934, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 639.62, "r_x1": 286.36, "r_y1": 639.62, "r_x2": 286.36, "r_y2": 630.71, "r_x3": 62.07, "r_y3": 630.71, "coord_origin": "TOPLEFT" }, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 651.57, "r_x1": 179.9, "r_y1": 651.57, "r_x2": 179.9, "r_y2": 642.67, "r_x3": 50.11, "r_y3": 642.67, "coord_origin": "TOPLEFT" }, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset." }, { "label": "section_header", "id": 12, "page_no": 10, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 50.11, "t": 662.39, "r": 153.61, "b": 672.24, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 672.24, "r_x1": 64.3, "r_y1": 672.24, "r_x2": 64.3, "r_y2": 662.39, "r_x3": 50.11, "r_y3": 662.39, "coord_origin": "TOPLEFT" }, "text": "1.2.", "orig": "1.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.75, "r_y0": 672.24, "r_x1": 153.61, "r_y1": 672.24, "r_x2": 153.61, "r_y2": 662.39, "r_x3": 73.75, "r_y3": 662.39, "coord_origin": "TOPLEFT" }, "text": "Synthetic datasets", "orig": "Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1.2. Synthetic datasets" }, { "label": "text", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 681.33, "r": 286.37, "b": 714.15, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 690.24, "r_x1": 286.36, "r_y1": 690.24, "r_x2": 286.36, "r_y2": 681.33, "r_x3": 62.07, "r_y3": 681.33, "coord_origin": "TOPLEFT" }, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 702.19, "r_x1": 286.37, "r_y1": 702.19, "r_x2": 286.37, "r_y2": 693.29, "r_x3": 50.11, "r_y3": 693.29, "coord_origin": "TOPLEFT" }, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 714.15, "r_x1": 84.14, "r_y1": 714.15, "r_x2": 84.14, "r_y2": 705.24, "r_x3": 50.11, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.24, "r_y0": 714.15, "r_x1": 286.37, "r_y1": 714.15, "r_x2": 286.37, "r_y2": 705.24, "r_x3": 91.24, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-" }, { "label": "text", "id": 8, "page_no": 10, "cluster": { "id": 8, "label": "text", "bbox": { "l": 308.86, "t": 162.66, "r": 545.12, "b": 207.43, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 171.56, "r_x1": 545.12, "r_y1": 171.56, "r_x2": 545.12, "r_y2": 162.66, "r_x3": 308.86, "r_y3": 162.66, "coord_origin": "TOPLEFT" }, "text": "ances in regard to their size, structure, style and content.", "orig": "ances in regard to their size, structure, style and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 183.52, "r_x1": 545.12, "r_y1": 183.52, "r_x2": 545.12, "r_y2": 174.61, "r_x3": 308.86, "r_y3": 174.61, "coord_origin": "TOPLEFT" }, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 195.47, "r_x1": 545.12, "r_y1": 195.47, "r_x2": 545.12, "r_y2": 186.57, "r_x3": 308.86, "r_y3": 186.57, "coord_origin": "TOPLEFT" }, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 207.43, "r_x1": 484.07, "r_y1": 207.43, "r_x2": 484.07, "r_y2": 198.52, "r_x3": 308.86, "r_y3": 198.52, "coord_origin": "TOPLEFT" }, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)." }, { "label": "text", "id": 15, "page_no": 10, "cluster": { "id": 15, "label": "text", "bbox": { "l": 308.86, "t": 211.24, "r": 545.12, "b": 232.1, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 220.14, "r_x1": 545.12, "r_y1": 220.14, "r_x2": 545.12, "r_y2": 211.24, "r_x3": 320.82, "r_y3": 211.24, "coord_origin": "TOPLEFT" }, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 232.1, "r_x1": 448.09, "r_y1": 232.1, "r_x2": 448.09, "r_y2": 223.19, "r_x3": 308.86, "r_y3": 223.19, "coord_origin": "TOPLEFT" }, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The process of generating a synthetic dataset can be decomposed into the following steps:" }, { "label": "list_item", "id": 7, "page_no": 10, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 308.86, "t": 235.91, "r": 545.12, "b": 316.54, "coord_origin": "TOPLEFT" }, "confidence": 0.964, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 244.81, "r_x1": 328.29, "r_y1": 244.81, "r_x2": 328.29, "r_y2": 235.91, "r_x3": 320.82, "r_y3": 235.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.38, "r_y0": 244.81, "r_x1": 545.11, "r_y1": 244.81, "r_x2": 545.11, "r_y2": 235.91, "r_x3": 335.38, "r_y3": 235.91, "coord_origin": "TOPLEFT" }, "text": "Prepare styling and content templates: The styling", "orig": "Prepare styling and content templates: The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 256.77, "r_x1": 545.12, "r_y1": 256.77, "r_x2": 545.12, "r_y2": 247.86, "r_x3": 308.86, "r_y3": 247.86, "coord_origin": "TOPLEFT" }, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 268.72, "r_x1": 545.12, "r_y1": 268.72, "r_x2": 545.12, "r_y2": 259.82, "r_x3": 308.86, "r_y3": 259.82, "coord_origin": "TOPLEFT" }, "text": "groups of scope specific appearances (e.g. financial data,", "orig": "groups of scope specific appearances (e.g. financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 280.68, "r_x1": 393.38, "r_y1": 280.68, "r_x2": 393.38, "r_y2": 271.77, "r_x3": 308.86, "r_y3": 271.77, "coord_origin": "TOPLEFT" }, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.12, "r_y0": 280.68, "r_x1": 545.12, "r_y1": 280.68, "r_x2": 545.12, "r_y2": 271.77, "r_x3": 400.12, "r_y3": 271.77, "coord_origin": "TOPLEFT" }, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 292.63, "r_x1": 545.12, "r_y1": 292.63, "r_x2": 545.12, "r_y2": 283.73, "r_x3": 308.86, "r_y3": 283.73, "coord_origin": "TOPLEFT" }, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.59, "r_x1": 545.12, "r_y1": 304.59, "r_x2": 545.12, "r_y2": 295.68, "r_x3": 308.86, "r_y3": 295.68, "coord_origin": "TOPLEFT" }, "text": "frequently used terms out of non-synthetic datasets (e.g.", "orig": "frequently used terms out of non-synthetic datasets (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.54, "r_x1": 425.69, "r_y1": 316.54, "r_x2": 425.69, "r_y2": 307.64, "r_x3": 308.86, "r_y3": 307.64, "coord_origin": "TOPLEFT" }, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)." }, { "label": "list_item", "id": 6, "page_no": 10, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 320.35, "r": 545.12, "b": 448.81, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 329.26, "r_x1": 328.49, "r_y1": 329.26, "r_x2": 328.49, "r_y2": 320.35, "r_x3": 320.82, "r_y3": 320.35, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.05, "r_y0": 329.26, "r_x1": 545.11, "r_y1": 329.26, "r_x2": 545.11, "r_y2": 320.35, "r_x3": 331.05, "r_y3": 320.35, "coord_origin": "TOPLEFT" }, "text": "Generate table structures: The structure of each syn-", "orig": "Generate table structures: The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 341.21, "r_x1": 545.12, "r_y1": 341.21, "r_x2": 545.12, "r_y2": 332.31, "r_x3": 308.86, "r_y3": 332.31, "coord_origin": "TOPLEFT" }, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 353.17, "r_x1": 545.12, "r_y1": 353.17, "r_x2": 545.12, "r_y2": 344.26, "r_x3": 308.86, "r_y3": 344.26, "coord_origin": "TOPLEFT" }, "text": "tentially spans over multiple rows and a table body that", "orig": "tentially spans over multiple rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 365.12, "r_x1": 545.12, "r_y1": 365.12, "r_x2": 545.12, "r_y2": 356.22, "r_x3": 308.86, "r_y3": 356.22, "coord_origin": "TOPLEFT" }, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 377.08, "r_x1": 545.12, "r_y1": 377.08, "r_x2": 545.12, "r_y2": 368.17, "r_x3": 308.86, "r_y3": 368.17, "coord_origin": "TOPLEFT" }, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 389.03, "r_x1": 545.11, "r_y1": 389.03, "r_x2": 545.11, "r_y2": 380.13, "r_x3": 308.86, "r_y3": 380.13, "coord_origin": "TOPLEFT" }, "text": "boundary. The table structure is described by the parame-", "orig": "boundary. The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.99, "r_x1": 545.12, "r_y1": 400.99, "r_x2": 545.12, "r_y2": 392.08, "r_x3": 308.86, "r_y3": 392.08, "coord_origin": "TOPLEFT" }, "text": "ters: Total number of table rows and columns, number of", "orig": "ters: Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.94, "r_x1": 545.12, "r_y1": 412.94, "r_x2": 545.12, "r_y2": 404.04, "r_x3": 308.86, "r_y3": 404.04, "coord_origin": "TOPLEFT" }, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.9, "r_x1": 545.11, "r_y1": 424.9, "r_x2": 545.11, "r_y2": 415.99, "r_x3": 308.86, "r_y3": 415.99, "coord_origin": "TOPLEFT" }, "text": "spans, column only spans, both row and column spans),", "orig": "spans, column only spans, both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.85, "r_x1": 545.12, "r_y1": 436.85, "r_x2": 545.12, "r_y2": 427.95, "r_x3": 308.86, "r_y3": 427.95, "coord_origin": "TOPLEFT" }, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.81, "r_x1": 345.94, "r_y1": 448.81, "r_x2": 345.94, "r_y2": 439.9, "r_x3": 308.86, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans." }, { "label": "list_item", "id": 9, "page_no": 10, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 452.62, "r": 545.12, "b": 497.39, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 461.52, "r_x1": 328.3, "r_y1": 461.52, "r_x2": 328.3, "r_y2": 452.62, "r_x3": 320.82, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.8, "r_y0": 461.52, "r_x1": 485.76, "r_y1": 461.52, "r_x2": 485.76, "r_y2": 452.62, "r_x3": 330.8, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": "Generate content: Based on the dataset", "orig": "Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.07, "r_y0": 461.29, "r_x1": 511.86, "r_y1": 461.29, "r_x2": 511.86, "r_y2": 452.71, "r_x3": 488.07, "r_y3": 452.71, "coord_origin": "TOPLEFT" }, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.86, "r_y0": 461.52, "r_x1": 545.11, "r_y1": 461.52, "r_x2": 545.11, "r_y2": 452.62, "r_x3": 511.86, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 473.48, "r_x1": 545.12, "r_y1": 473.48, "r_x2": 545.12, "r_y2": 464.57, "r_x3": 308.86, "r_y3": 464.57, "coord_origin": "TOPLEFT" }, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 485.43, "r_x1": 545.12, "r_y1": 485.43, "r_x2": 545.12, "r_y2": 476.53, "r_x3": 308.86, "r_y3": 476.53, "coord_origin": "TOPLEFT" }, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.39, "r_x1": 379.15, "r_y1": 497.39, "r_x2": 379.15, "r_y2": 488.48, "r_x3": 308.86, "r_y3": 488.48, "coord_origin": "TOPLEFT" }, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content." }, { "label": "list_item", "id": 5, "page_no": 10, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 308.86, "t": 501.2, "r": 545.12, "b": 545.97, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 510.1, "r_x1": 328.66, "r_y1": 510.1, "r_x2": 328.66, "r_y2": 501.2, "r_x3": 320.82, "r_y3": 501.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.28, "r_y0": 510.1, "r_x1": 545.11, "r_y1": 510.1, "r_x2": 545.11, "r_y2": 501.2, "r_x3": 331.28, "r_y3": 501.2, "coord_origin": "TOPLEFT" }, "text": "Apply styling templates: Depending on the domain", "orig": "Apply styling templates: Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 522.06, "r_x1": 545.12, "r_y1": 522.06, "r_x2": 545.12, "r_y2": 513.15, "r_x3": 308.86, "r_y3": 513.15, "coord_origin": "TOPLEFT" }, "text": "of the synthetic dataset, a set of styling templates is first", "orig": "of the synthetic dataset, a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 534.01, "r_x1": 384.3, "r_y1": 534.01, "r_x2": 384.3, "r_y2": 525.11, "r_x3": 308.86, "r_y3": 525.11, "coord_origin": "TOPLEFT" }, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.25, "r_y0": 534.01, "r_x1": 545.12, "r_y1": 534.01, "r_x2": 545.12, "r_y2": 525.11, "r_x3": 391.25, "r_y3": 525.11, "coord_origin": "TOPLEFT" }, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.97, "r_x1": 496.16, "r_y1": 545.97, "r_x2": 496.16, "r_y2": 537.06, "r_x3": 308.86, "r_y3": 537.06, "coord_origin": "TOPLEFT" }, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table." }, { "label": "list_item", "id": 4, "page_no": 10, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 308.86, "t": 549.78, "r": 545.12, "b": 606.5, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 558.68, "r_x1": 328.29, "r_y1": 558.68, "r_x2": 328.29, "r_y2": 549.78, "r_x3": 320.82, "r_y3": 549.78, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.4, "r_y0": 558.68, "r_x1": 545.11, "r_y1": 558.68, "r_x2": 545.11, "r_y2": 549.78, "r_x3": 335.4, "r_y3": 549.78, "coord_origin": "TOPLEFT" }, "text": "Render the complete tables: The synthetic table is", "orig": "Render the complete tables: The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 570.64, "r_x1": 545.12, "r_y1": 570.64, "r_x2": 545.12, "r_y2": 561.73, "r_x3": 308.86, "r_y3": 561.73, "coord_origin": "TOPLEFT" }, "text": "finally rendered by a web browser engine to generate the", "orig": "finally rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 582.59, "r_x1": 545.12, "r_y1": 582.59, "r_x2": 545.12, "r_y2": 573.69, "r_x3": 308.86, "r_y3": 573.69, "coord_origin": "TOPLEFT" }, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 594.55, "r_x1": 545.12, "r_y1": 594.55, "r_x2": 545.12, "r_y2": 585.64, "r_x3": 308.86, "r_y3": 585.64, "coord_origin": "TOPLEFT" }, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 606.5, "r_x1": 341.23, "r_y1": 606.5, "r_x2": 341.23, "r_y2": 597.6, "r_x3": 308.86, "r_y3": 597.6, "coord_origin": "TOPLEFT" }, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process." }, { "label": "section_header", "id": 10, "page_no": 10, "cluster": { "id": 10, "label": "section_header", "bbox": { "l": 308.86, "t": 622.29, "r": 545.11, "b": 646.99, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 633.04, "r_x1": 316.77, "r_y1": 633.04, "r_x2": 316.77, "r_y2": 622.29, "r_x3": 308.86, "r_y3": 622.29, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.31, "r_y0": 633.04, "r_x1": 545.11, "r_y1": 633.04, "r_x2": 545.11, "r_y2": 622.29, "r_x3": 327.31, "r_y3": 622.29, "coord_origin": "TOPLEFT" }, "text": "Prediction post-processing for PDF docu-", "orig": "Prediction post-processing for PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 646.99, "r_x1": 357.34, "r_y1": 646.99, "r_x2": 357.34, "r_y2": 636.24, "r_x3": 326.8, "r_y3": 636.24, "coord_origin": "TOPLEFT" }, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Prediction post-processing for PDF documents" }, { "label": "text", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 657.42, "r": 545.12, "b": 714.15, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 666.33, "r_x1": 545.11, "r_y1": 666.33, "r_x2": 545.11, "r_y2": 657.42, "r_x3": 320.82, "r_y3": 657.42, "coord_origin": "TOPLEFT" }, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 678.28, "r_x1": 545.12, "r_y1": 678.28, "r_x2": 545.12, "r_y2": 669.38, "r_x3": 308.86, "r_y3": 669.38, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 690.24, "r_x1": 545.12, "r_y1": 690.24, "r_x2": 545.12, "r_y2": 681.33, "r_x3": 308.86, "r_y3": 681.33, "coord_origin": "TOPLEFT" }, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 702.19, "r_x1": 545.12, "r_y1": 702.19, "r_x2": 545.12, "r_y2": 693.29, "r_x3": 308.86, "r_y3": 693.29, "coord_origin": "TOPLEFT" }, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 714.15, "r_x1": 371.43, "r_y1": 714.15, "r_x2": 371.43, "r_y2": 705.24, "r_x3": 308.86, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:" }, { "label": "page_footer", "id": 16, "page_no": 10, "cluster": { "id": 16, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.899, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" } ], "body": [ { "label": "section_header", "id": 18, "page_no": 10, "cluster": { "id": 18, "label": "section_header", "bbox": { "l": 132.84, "t": 110.57, "r": 465.38, "b": 135.53, "coord_origin": "TOPLEFT" }, "confidence": 0.65, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.84, "r_y0": 121.32, "r_x1": 465.38, "r_y1": 121.32, "r_x2": 465.38, "r_y2": 110.57, "r_x3": 132.84, "r_y3": 110.57, "coord_origin": "TOPLEFT" }, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.18, "r_y0": 135.53, "r_x1": 375.04, "r_y1": 135.53, "r_x2": 375.04, "r_y2": 122.26, "r_x3": 220.18, "r_y3": 122.26, "coord_origin": "TOPLEFT" }, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material" }, { "label": "section_header", "id": 13, "page_no": 10, "cluster": { "id": 13, "label": "section_header", "bbox": { "l": 50.11, "t": 161.16, "r": 175.96, "b": 171.91, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 171.91, "r_x1": 57.09, "r_y1": 171.91, "r_x2": 57.09, "r_y2": 161.16, "r_x3": 50.11, "r_y3": 161.16, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 66.39, "r_y0": 171.91, "r_x1": 175.96, "r_y1": 171.91, "r_x2": 175.96, "r_y2": 161.16, "r_x3": 66.39, "r_y3": 161.16, "coord_origin": "TOPLEFT" }, "text": "Details on the datasets", "orig": "Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Details on the datasets" }, { "label": "section_header", "id": 11, "page_no": 10, "cluster": { "id": 11, "label": "section_header", "bbox": { "l": 50.11, "t": 180.98, "r": 150.36, "b": 190.83, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 190.83, "r_x1": 64.21, "r_y1": 190.83, "r_x2": 64.21, "r_y2": 180.98, "r_x3": 50.11, "r_y3": 180.98, "coord_origin": "TOPLEFT" }, "text": "1.1.", "orig": "1.1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.61, "r_y0": 190.83, "r_x1": 150.36, "r_y1": 190.83, "r_x2": 150.36, "r_y2": 180.98, "r_x3": 73.61, "r_y3": 180.98, "coord_origin": "TOPLEFT" }, "text": "Data preparation", "orig": "Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1.1. Data preparation" }, { "label": "text", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 199.92, "r": 286.37, "b": 388.15, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 208.83, "r_x1": 286.36, "r_y1": 208.83, "r_x2": 286.36, "r_y2": 199.92, "r_x3": 62.07, "r_y3": 199.92, "coord_origin": "TOPLEFT" }, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 220.78, "r_x1": 286.37, "r_y1": 220.78, "r_x2": 286.37, "r_y2": 211.88, "r_x3": 50.11, "r_y3": 211.88, "coord_origin": "TOPLEFT" }, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 232.74, "r_x1": 286.37, "r_y1": 232.74, "r_x2": 286.37, "r_y2": 223.83, "r_x3": 50.11, "r_y3": 223.83, "coord_origin": "TOPLEFT" }, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 244.69, "r_x1": 286.37, "r_y1": 244.69, "r_x2": 286.37, "r_y2": 235.79, "r_x3": 50.11, "r_y3": 235.79, "coord_origin": "TOPLEFT" }, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 256.65, "r_x1": 286.37, "r_y1": 256.65, "r_x2": 286.37, "r_y2": 247.74, "r_x3": 50.11, "r_y3": 247.74, "coord_origin": "TOPLEFT" }, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 268.6, "r_x1": 286.37, "r_y1": 268.6, "r_x2": 286.37, "r_y2": 259.7, "r_x3": 50.11, "r_y3": 259.7, "coord_origin": "TOPLEFT" }, "text": "omitted bounding boxes). A table is considered to be simple", "orig": "omitted bounding boxes). A table is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 280.56, "r_x1": 286.37, "r_y1": 280.56, "r_x2": 286.37, "r_y2": 271.65, "r_x3": 50.11, "r_y3": 271.65, "coord_origin": "TOPLEFT" }, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 292.51, "r_x1": 286.37, "r_y1": 292.51, "r_x2": 286.37, "r_y2": 283.61, "r_x3": 50.11, "r_y3": 283.61, "coord_origin": "TOPLEFT" }, "text": "ally, a table has a strict HTML structure if every row has the", "orig": "ally, a table has a strict HTML structure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 304.47, "r_x1": 286.37, "r_y1": 304.47, "r_x2": 286.37, "r_y2": 295.56, "r_x3": 50.11, "r_y3": 295.56, "coord_origin": "TOPLEFT" }, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 316.42, "r_x1": 286.37, "r_y1": 316.42, "r_x2": 286.37, "r_y2": 307.52, "r_x3": 50.11, "r_y3": 307.52, "coord_origin": "TOPLEFT" }, "text": "or column spans. Therefore a strict HTML structure looks", "orig": "or column spans. Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 328.38, "r_x1": 286.37, "r_y1": 328.38, "r_x2": 286.37, "r_y2": 319.47, "r_x3": 50.11, "r_y3": 319.47, "coord_origin": "TOPLEFT" }, "text": "always rectangular. However, HTML is a lenient encoding", "orig": "always rectangular. However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 340.33, "r_x1": 286.37, "r_y1": 340.33, "r_x2": 286.37, "r_y2": 331.43, "r_x3": 50.11, "r_y3": 331.43, "coord_origin": "TOPLEFT" }, "text": "format, i.e. tables with rows of different sizes might still", "orig": "format, i.e. tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 352.29, "r_x1": 286.37, "r_y1": 352.29, "r_x2": 286.37, "r_y2": 343.38, "r_x3": 50.11, "r_y3": 343.38, "coord_origin": "TOPLEFT" }, "text": "be regarded as correct due to implicit display rules. These", "orig": "be regarded as correct due to implicit display rules. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 364.24, "r_x1": 286.37, "r_y1": 364.24, "r_x2": 286.37, "r_y2": 355.34, "r_x3": 50.11, "r_y3": 355.34, "coord_origin": "TOPLEFT" }, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 376.2, "r_x1": 286.37, "r_y1": 376.2, "r_x2": 286.37, "r_y2": 367.29, "r_x3": 50.11, "r_y3": 367.29, "coord_origin": "TOPLEFT" }, "text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 388.15, "r_x1": 230.8, "r_y1": 388.15, "r_x2": 230.8, "r_y2": 379.25, "r_x3": 50.11, "r_y3": 379.25, "coord_origin": "TOPLEFT" }, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). A table is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTML structure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have \"strict\" tables, i.e. tables where every row has exactly the same length." }, { "label": "text", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "text", "bbox": { "l": 50.11, "t": 391.41, "r": 286.37, "b": 627.46, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 400.31, "r_x1": 286.36, "r_y1": 400.31, "r_x2": 286.36, "r_y2": 391.41, "r_x3": 62.07, "r_y3": 391.41, "coord_origin": "TOPLEFT" }, "text": "We have developed a technique that tries to derive a", "orig": "We have developed a technique that tries to derive a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 412.27, "r_x1": 286.37, "r_y1": 412.27, "r_x2": 286.37, "r_y2": 403.36, "r_x3": 50.11, "r_y3": 403.36, "coord_origin": "TOPLEFT" }, "text": "missing bounding box out of its neighbors. As a first step,", "orig": "missing bounding box out of its neighbors. As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 424.22, "r_x1": 286.37, "r_y1": 424.22, "r_x2": 286.37, "r_y2": 415.32, "r_x3": 50.11, "r_y3": 415.32, "coord_origin": "TOPLEFT" }, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 436.18, "r_x1": 286.37, "r_y1": 436.18, "r_x2": 286.37, "r_y2": 427.27, "r_x3": 50.11, "r_y3": 427.27, "coord_origin": "TOPLEFT" }, "text": "grid that covers the table structure. In case of strict HTML", "orig": "grid that covers the table structure. In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 448.13, "r_x1": 286.37, "r_y1": 448.13, "r_x2": 286.37, "r_y2": 439.23, "r_x3": 50.11, "r_y3": 439.23, "coord_origin": "TOPLEFT" }, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 460.09, "r_x1": 286.37, "r_y1": 460.09, "r_x2": 286.37, "r_y2": 451.18, "r_x3": 50.11, "r_y3": 451.18, "coord_origin": "TOPLEFT" }, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 472.04, "r_x1": 286.37, "r_y1": 472.04, "r_x2": 286.37, "r_y2": 463.14, "r_x3": 50.11, "r_y3": 463.14, "coord_origin": "TOPLEFT" }, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 484.0, "r_x1": 286.37, "r_y1": 484.0, "r_x2": 286.37, "r_y2": 475.09, "r_x3": 50.11, "r_y3": 475.09, "coord_origin": "TOPLEFT" }, "text": "for a rectangular table, it is possible to compute the geo-", "orig": "for a rectangular table, it is possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 495.95, "r_x1": 286.37, "r_y1": 495.95, "r_x2": 286.37, "r_y2": 487.05, "r_x3": 50.11, "r_y3": 487.05, "coord_origin": "TOPLEFT" }, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 507.91, "r_x1": 286.37, "r_y1": 507.91, "r_x2": 286.37, "r_y2": 499.0, "r_x3": 50.11, "r_y3": 499.0, "coord_origin": "TOPLEFT" }, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 519.86, "r_x1": 286.37, "r_y1": 519.86, "r_x2": 286.37, "r_y2": 510.96, "r_x3": 50.11, "r_y3": 510.96, "coord_origin": "TOPLEFT" }, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 531.82, "r_x1": 286.37, "r_y1": 531.82, "r_x2": 286.37, "r_y2": 522.91, "r_x3": 50.11, "r_y3": 522.91, "coord_origin": "TOPLEFT" }, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 543.77, "r_x1": 286.37, "r_y1": 543.77, "r_x2": 286.37, "r_y2": 534.87, "r_x3": 50.11, "r_y3": 534.87, "coord_origin": "TOPLEFT" }, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 555.73, "r_x1": 286.37, "r_y1": 555.73, "r_x2": 286.37, "r_y2": 546.82, "r_x3": 50.11, "r_y3": 546.82, "coord_origin": "TOPLEFT" }, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 567.68, "r_x1": 257.47, "r_y1": 567.68, "r_x2": 257.47, "r_y2": 558.78, "r_x3": 50.11, "r_y3": 558.78, "coord_origin": "TOPLEFT" }, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.95, "r_y0": 567.68, "r_x1": 286.37, "r_y1": 567.68, "r_x2": 286.37, "r_y2": 558.78, "r_x3": 263.95, "r_y3": 558.78, "coord_origin": "TOPLEFT" }, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 579.64, "r_x1": 286.37, "r_y1": 579.64, "r_x2": 286.37, "r_y2": 570.73, "r_x3": 50.11, "r_y3": 570.73, "coord_origin": "TOPLEFT" }, "text": "we have decided to simply discard those tables. In case of", "orig": "we have decided to simply discard those tables. In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 591.59, "r_x1": 286.37, "r_y1": 591.59, "r_x2": 286.37, "r_y2": 582.69, "r_x3": 50.11, "r_y3": 582.69, "coord_origin": "TOPLEFT" }, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 603.55, "r_x1": 286.37, "r_y1": 603.55, "r_x2": 286.37, "r_y2": 594.64, "r_x3": 50.11, "r_y3": 594.64, "coord_origin": "TOPLEFT" }, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 615.5, "r_x1": 286.37, "r_y1": 615.5, "r_x2": 286.37, "r_y2": 606.6, "r_x3": 50.11, "r_y3": 606.6, "coord_origin": "TOPLEFT" }, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 627.46, "r_x1": 242.26, "r_y1": 627.46, "r_x2": 242.26, "r_y2": 618.55, "r_x3": 50.11, "r_y3": 618.55, "coord_origin": "TOPLEFT" }, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes." }, { "label": "text", "id": 14, "page_no": 10, "cluster": { "id": 14, "label": "text", "bbox": { "l": 50.11, "t": 630.71, "r": 286.36, "b": 651.57, "coord_origin": "TOPLEFT" }, "confidence": 0.934, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 639.62, "r_x1": 286.36, "r_y1": 639.62, "r_x2": 286.36, "r_y2": 630.71, "r_x3": 62.07, "r_y3": 630.71, "coord_origin": "TOPLEFT" }, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 651.57, "r_x1": 179.9, "r_y1": 651.57, "r_x2": 179.9, "r_y2": 642.67, "r_x3": 50.11, "r_y3": 642.67, "coord_origin": "TOPLEFT" }, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset." }, { "label": "section_header", "id": 12, "page_no": 10, "cluster": { "id": 12, "label": "section_header", "bbox": { "l": 50.11, "t": 662.39, "r": 153.61, "b": 672.24, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 672.24, "r_x1": 64.3, "r_y1": 672.24, "r_x2": 64.3, "r_y2": 662.39, "r_x3": 50.11, "r_y3": 662.39, "coord_origin": "TOPLEFT" }, "text": "1.2.", "orig": "1.2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.75, "r_y0": 672.24, "r_x1": 153.61, "r_y1": 672.24, "r_x2": 153.61, "r_y2": 662.39, "r_x3": 73.75, "r_y3": 662.39, "coord_origin": "TOPLEFT" }, "text": "Synthetic datasets", "orig": "Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1.2. Synthetic datasets" }, { "label": "text", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 681.33, "r": 286.37, "b": 714.15, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 690.24, "r_x1": 286.36, "r_y1": 690.24, "r_x2": 286.36, "r_y2": 681.33, "r_x3": 62.07, "r_y3": 681.33, "coord_origin": "TOPLEFT" }, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 702.19, "r_x1": 286.37, "r_y1": 702.19, "r_x2": 286.37, "r_y2": 693.29, "r_x3": 50.11, "r_y3": 693.29, "coord_origin": "TOPLEFT" }, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 714.15, "r_x1": 84.14, "r_y1": 714.15, "r_x2": 84.14, "r_y2": 705.24, "r_x3": 50.11, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 91.24, "r_y0": 714.15, "r_x1": 286.37, "r_y1": 714.15, "r_x2": 286.37, "r_y2": 705.24, "r_x3": 91.24, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-" }, { "label": "text", "id": 8, "page_no": 10, "cluster": { "id": 8, "label": "text", "bbox": { "l": 308.86, "t": 162.66, "r": 545.12, "b": 207.43, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 171.56, "r_x1": 545.12, "r_y1": 171.56, "r_x2": 545.12, "r_y2": 162.66, "r_x3": 308.86, "r_y3": 162.66, "coord_origin": "TOPLEFT" }, "text": "ances in regard to their size, structure, style and content.", "orig": "ances in regard to their size, structure, style and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 183.52, "r_x1": 545.12, "r_y1": 183.52, "r_x2": 545.12, "r_y2": 174.61, "r_x3": 308.86, "r_y3": 174.61, "coord_origin": "TOPLEFT" }, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 195.47, "r_x1": 545.12, "r_y1": 195.47, "r_x2": 545.12, "r_y2": 186.57, "r_x3": 308.86, "r_y3": 186.57, "coord_origin": "TOPLEFT" }, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 207.43, "r_x1": 484.07, "r_y1": 207.43, "r_x2": 484.07, "r_y2": 198.52, "r_x3": 308.86, "r_y3": 198.52, "coord_origin": "TOPLEFT" }, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)." }, { "label": "text", "id": 15, "page_no": 10, "cluster": { "id": 15, "label": "text", "bbox": { "l": 308.86, "t": 211.24, "r": 545.12, "b": 232.1, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 220.14, "r_x1": 545.12, "r_y1": 220.14, "r_x2": 545.12, "r_y2": 211.24, "r_x3": 320.82, "r_y3": 211.24, "coord_origin": "TOPLEFT" }, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 232.1, "r_x1": 448.09, "r_y1": 232.1, "r_x2": 448.09, "r_y2": 223.19, "r_x3": 308.86, "r_y3": 223.19, "coord_origin": "TOPLEFT" }, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The process of generating a synthetic dataset can be decomposed into the following steps:" }, { "label": "list_item", "id": 7, "page_no": 10, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 308.86, "t": 235.91, "r": 545.12, "b": 316.54, "coord_origin": "TOPLEFT" }, "confidence": 0.964, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 244.81, "r_x1": 328.29, "r_y1": 244.81, "r_x2": 328.29, "r_y2": 235.91, "r_x3": 320.82, "r_y3": 235.91, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.38, "r_y0": 244.81, "r_x1": 545.11, "r_y1": 244.81, "r_x2": 545.11, "r_y2": 235.91, "r_x3": 335.38, "r_y3": 235.91, "coord_origin": "TOPLEFT" }, "text": "Prepare styling and content templates: The styling", "orig": "Prepare styling and content templates: The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 256.77, "r_x1": 545.12, "r_y1": 256.77, "r_x2": 545.12, "r_y2": 247.86, "r_x3": 308.86, "r_y3": 247.86, "coord_origin": "TOPLEFT" }, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 268.72, "r_x1": 545.12, "r_y1": 268.72, "r_x2": 545.12, "r_y2": 259.82, "r_x3": 308.86, "r_y3": 259.82, "coord_origin": "TOPLEFT" }, "text": "groups of scope specific appearances (e.g. financial data,", "orig": "groups of scope specific appearances (e.g. financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 280.68, "r_x1": 393.38, "r_y1": 280.68, "r_x2": 393.38, "r_y2": 271.77, "r_x3": 308.86, "r_y3": 271.77, "coord_origin": "TOPLEFT" }, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 400.12, "r_y0": 280.68, "r_x1": 545.12, "r_y1": 280.68, "r_x2": 545.12, "r_y2": 271.77, "r_x3": 400.12, "r_y3": 271.77, "coord_origin": "TOPLEFT" }, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 292.63, "r_x1": 545.12, "r_y1": 292.63, "r_x2": 545.12, "r_y2": 283.73, "r_x3": 308.86, "r_y3": 283.73, "coord_origin": "TOPLEFT" }, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.59, "r_x1": 545.12, "r_y1": 304.59, "r_x2": 545.12, "r_y2": 295.68, "r_x3": 308.86, "r_y3": 295.68, "coord_origin": "TOPLEFT" }, "text": "frequently used terms out of non-synthetic datasets (e.g.", "orig": "frequently used terms out of non-synthetic datasets (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.54, "r_x1": 425.69, "r_y1": 316.54, "r_x2": 425.69, "r_y2": 307.64, "r_x3": 308.86, "r_y3": 307.64, "coord_origin": "TOPLEFT" }, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)." }, { "label": "list_item", "id": 6, "page_no": 10, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 320.35, "r": 545.12, "b": 448.81, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 329.26, "r_x1": 328.49, "r_y1": 329.26, "r_x2": 328.49, "r_y2": 320.35, "r_x3": 320.82, "r_y3": 320.35, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.05, "r_y0": 329.26, "r_x1": 545.11, "r_y1": 329.26, "r_x2": 545.11, "r_y2": 320.35, "r_x3": 331.05, "r_y3": 320.35, "coord_origin": "TOPLEFT" }, "text": "Generate table structures: The structure of each syn-", "orig": "Generate table structures: The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 341.21, "r_x1": 545.12, "r_y1": 341.21, "r_x2": 545.12, "r_y2": 332.31, "r_x3": 308.86, "r_y3": 332.31, "coord_origin": "TOPLEFT" }, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 353.17, "r_x1": 545.12, "r_y1": 353.17, "r_x2": 545.12, "r_y2": 344.26, "r_x3": 308.86, "r_y3": 344.26, "coord_origin": "TOPLEFT" }, "text": "tentially spans over multiple rows and a table body that", "orig": "tentially spans over multiple rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 365.12, "r_x1": 545.12, "r_y1": 365.12, "r_x2": 545.12, "r_y2": 356.22, "r_x3": 308.86, "r_y3": 356.22, "coord_origin": "TOPLEFT" }, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 377.08, "r_x1": 545.12, "r_y1": 377.08, "r_x2": 545.12, "r_y2": 368.17, "r_x3": 308.86, "r_y3": 368.17, "coord_origin": "TOPLEFT" }, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 389.03, "r_x1": 545.11, "r_y1": 389.03, "r_x2": 545.11, "r_y2": 380.13, "r_x3": 308.86, "r_y3": 380.13, "coord_origin": "TOPLEFT" }, "text": "boundary. The table structure is described by the parame-", "orig": "boundary. The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 400.99, "r_x1": 545.12, "r_y1": 400.99, "r_x2": 545.12, "r_y2": 392.08, "r_x3": 308.86, "r_y3": 392.08, "coord_origin": "TOPLEFT" }, "text": "ters: Total number of table rows and columns, number of", "orig": "ters: Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.94, "r_x1": 545.12, "r_y1": 412.94, "r_x2": 545.12, "r_y2": 404.04, "r_x3": 308.86, "r_y3": 404.04, "coord_origin": "TOPLEFT" }, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.9, "r_x1": 545.11, "r_y1": 424.9, "r_x2": 545.11, "r_y2": 415.99, "r_x3": 308.86, "r_y3": 415.99, "coord_origin": "TOPLEFT" }, "text": "spans, column only spans, both row and column spans),", "orig": "spans, column only spans, both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.85, "r_x1": 545.12, "r_y1": 436.85, "r_x2": 545.12, "r_y2": 427.95, "r_x3": 308.86, "r_y3": 427.95, "coord_origin": "TOPLEFT" }, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.81, "r_x1": 345.94, "r_y1": 448.81, "r_x2": 345.94, "r_y2": 439.9, "r_x3": 308.86, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans." }, { "label": "list_item", "id": 9, "page_no": 10, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 452.62, "r": 545.12, "b": 497.39, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 461.52, "r_x1": 328.3, "r_y1": 461.52, "r_x2": 328.3, "r_y2": 452.62, "r_x3": 320.82, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.8, "r_y0": 461.52, "r_x1": 485.76, "r_y1": 461.52, "r_x2": 485.76, "r_y2": 452.62, "r_x3": 330.8, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": "Generate content: Based on the dataset", "orig": "Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.07, "r_y0": 461.29, "r_x1": 511.86, "r_y1": 461.29, "r_x2": 511.86, "r_y2": 452.71, "r_x3": 488.07, "r_y3": 452.71, "coord_origin": "TOPLEFT" }, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 511.86, "r_y0": 461.52, "r_x1": 545.11, "r_y1": 461.52, "r_x2": 545.11, "r_y2": 452.62, "r_x3": 511.86, "r_y3": 452.62, "coord_origin": "TOPLEFT" }, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 473.48, "r_x1": 545.12, "r_y1": 473.48, "r_x2": 545.12, "r_y2": 464.57, "r_x3": 308.86, "r_y3": 464.57, "coord_origin": "TOPLEFT" }, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 485.43, "r_x1": 545.12, "r_y1": 485.43, "r_x2": 545.12, "r_y2": 476.53, "r_x3": 308.86, "r_y3": 476.53, "coord_origin": "TOPLEFT" }, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 497.39, "r_x1": 379.15, "r_y1": 497.39, "r_x2": 379.15, "r_y2": 488.48, "r_x3": 308.86, "r_y3": 488.48, "coord_origin": "TOPLEFT" }, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content." }, { "label": "list_item", "id": 5, "page_no": 10, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 308.86, "t": 501.2, "r": 545.12, "b": 545.97, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 510.1, "r_x1": 328.66, "r_y1": 510.1, "r_x2": 328.66, "r_y2": 501.2, "r_x3": 320.82, "r_y3": 501.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.28, "r_y0": 510.1, "r_x1": 545.11, "r_y1": 510.1, "r_x2": 545.11, "r_y2": 501.2, "r_x3": 331.28, "r_y3": 501.2, "coord_origin": "TOPLEFT" }, "text": "Apply styling templates: Depending on the domain", "orig": "Apply styling templates: Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 522.06, "r_x1": 545.12, "r_y1": 522.06, "r_x2": 545.12, "r_y2": 513.15, "r_x3": 308.86, "r_y3": 513.15, "coord_origin": "TOPLEFT" }, "text": "of the synthetic dataset, a set of styling templates is first", "orig": "of the synthetic dataset, a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 534.01, "r_x1": 384.3, "r_y1": 534.01, "r_x2": 384.3, "r_y2": 525.11, "r_x3": 308.86, "r_y3": 525.11, "coord_origin": "TOPLEFT" }, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.25, "r_y0": 534.01, "r_x1": 545.12, "r_y1": 534.01, "r_x2": 545.12, "r_y2": 525.11, "r_x3": 391.25, "r_y3": 525.11, "coord_origin": "TOPLEFT" }, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 545.97, "r_x1": 496.16, "r_y1": 545.97, "r_x2": 496.16, "r_y2": 537.06, "r_x3": 308.86, "r_y3": 537.06, "coord_origin": "TOPLEFT" }, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table." }, { "label": "list_item", "id": 4, "page_no": 10, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 308.86, "t": 549.78, "r": 545.12, "b": 606.5, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 558.68, "r_x1": 328.29, "r_y1": 558.68, "r_x2": 328.29, "r_y2": 549.78, "r_x3": 320.82, "r_y3": 549.78, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.4, "r_y0": 558.68, "r_x1": 545.11, "r_y1": 558.68, "r_x2": 545.11, "r_y2": 549.78, "r_x3": 335.4, "r_y3": 549.78, "coord_origin": "TOPLEFT" }, "text": "Render the complete tables: The synthetic table is", "orig": "Render the complete tables: The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 570.64, "r_x1": 545.12, "r_y1": 570.64, "r_x2": 545.12, "r_y2": 561.73, "r_x3": 308.86, "r_y3": 561.73, "coord_origin": "TOPLEFT" }, "text": "finally rendered by a web browser engine to generate the", "orig": "finally rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 582.59, "r_x1": 545.12, "r_y1": 582.59, "r_x2": 545.12, "r_y2": 573.69, "r_x3": 308.86, "r_y3": 573.69, "coord_origin": "TOPLEFT" }, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 594.55, "r_x1": 545.12, "r_y1": 594.55, "r_x2": 545.12, "r_y2": 585.64, "r_x3": 308.86, "r_y3": 585.64, "coord_origin": "TOPLEFT" }, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 606.5, "r_x1": 341.23, "r_y1": 606.5, "r_x2": 341.23, "r_y2": 597.6, "r_x3": 308.86, "r_y3": 597.6, "coord_origin": "TOPLEFT" }, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process." }, { "label": "section_header", "id": 10, "page_no": 10, "cluster": { "id": 10, "label": "section_header", "bbox": { "l": 308.86, "t": 622.29, "r": 545.11, "b": 646.99, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 633.04, "r_x1": 316.77, "r_y1": 633.04, "r_x2": 316.77, "r_y2": 622.29, "r_x3": 308.86, "r_y3": 622.29, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.31, "r_y0": 633.04, "r_x1": 545.11, "r_y1": 633.04, "r_x2": 545.11, "r_y2": 622.29, "r_x3": 327.31, "r_y3": 622.29, "coord_origin": "TOPLEFT" }, "text": "Prediction post-processing for PDF docu-", "orig": "Prediction post-processing for PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.8, "r_y0": 646.99, "r_x1": 357.34, "r_y1": 646.99, "r_x2": 357.34, "r_y2": 636.24, "r_x3": 326.8, "r_y3": 636.24, "coord_origin": "TOPLEFT" }, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Prediction post-processing for PDF documents" }, { "label": "text", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "text", "bbox": { "l": 308.86, "t": 657.42, "r": 545.12, "b": 714.15, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 666.33, "r_x1": 545.11, "r_y1": 666.33, "r_x2": 545.11, "r_y2": 657.42, "r_x3": 320.82, "r_y3": 657.42, "coord_origin": "TOPLEFT" }, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 678.28, "r_x1": 545.12, "r_y1": 678.28, "r_x2": 545.12, "r_y2": 669.38, "r_x3": 308.86, "r_y3": 669.38, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 690.24, "r_x1": 545.12, "r_y1": 690.24, "r_x2": 545.12, "r_y2": 681.33, "r_x3": 308.86, "r_y3": 681.33, "coord_origin": "TOPLEFT" }, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 702.19, "r_x1": 545.12, "r_y1": 702.19, "r_x2": 545.12, "r_y2": 693.29, "r_x3": 308.86, "r_y3": 693.29, "coord_origin": "TOPLEFT" }, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 714.15, "r_x1": 371.43, "r_y1": 714.15, "r_x2": 371.43, "r_y2": 705.24, "r_x3": 308.86, "r_y3": 705.24, "coord_origin": "TOPLEFT" }, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:" } ], "headers": [ { "label": "page_footer", "id": 16, "page_no": 10, "cluster": { "id": 16, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.899, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" } ] } }, { "page_no": 11, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39, "r_y0": 83.26, "r_x1": 151.95, "r_y1": 83.26, "r_x2": 151.95, "r_y2": 77.31, "r_x3": 119.39, "r_y3": 77.31, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.35, "r_y0": 81.14, "r_x1": 59.33, "r_y1": 81.14, "r_x2": 59.33, "r_y2": 75.19, "r_x3": 53.35, "r_y3": 75.19, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.58, "r_y0": 83.41, "r_x1": 319.83, "r_y1": 83.41, "r_x2": 319.83, "r_y2": 77.46, "r_x3": 289.58, "r_y3": 77.46, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37, "r_y0": 83.2, "r_x1": 481.76, "r_y1": 83.2, "r_x2": 481.76, "r_y2": 77.25, "r_x3": 448.37, "r_y3": 77.25, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.55, "r_y0": 146.23, "r_x1": 94.98, "r_y1": 146.23, "r_x2": 94.98, "r_y2": 141.28, "r_x3": 82.55, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.04, "r_y0": 106.06, "r_x1": 85.29, "r_y1": 106.06, "r_x2": 85.29, "r_y2": 101.1, "r_x3": 63.04, "r_y3": 101.1, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 129.35, "r_x1": 85.23, "r_y1": 129.35, "r_x2": 85.23, "r_y2": 124.4, "r_x3": 67.77, "r_y3": 124.4, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55, "r_y0": 107.5, "r_x1": 249.8, "r_y1": 107.5, "r_x2": 249.8, "r_y2": 102.54, "r_x3": 227.55, "r_y3": 102.54, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.2, "r_y0": 131.94, "r_x1": 249.66, "r_y1": 131.94, "r_x2": 249.66, "r_y2": 126.99, "r_x3": 232.2, "r_y3": 126.99, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.23, "r_y0": 119.0, "r_x1": 413.7, "r_y1": 119.0, "r_x2": 413.7, "r_y2": 114.05, "r_x3": 396.23, "r_y3": 114.05, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.38, "r_y0": 146.23, "r_x1": 105.08, "r_y1": 146.23, "r_x2": 105.08, "r_y2": 141.28, "r_x3": 97.38, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.94, "r_y0": 90.69, "r_x1": 76.15, "r_y1": 90.69, "r_x2": 76.15, "r_y2": 85.73, "r_x3": 60.94, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.3, "r_y0": 91.18, "r_x1": 106.99, "r_y1": 91.18, "r_x2": 106.99, "r_y2": 86.22, "r_x3": 82.3, "r_y3": 86.22, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.21, "r_y0": 146.56, "r_x1": 281.88, "r_y1": 146.56, "r_x2": 281.88, "r_y2": 141.61, "r_x3": 246.21, "r_y3": 141.61, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.7, "r_y0": 90.69, "r_x1": 241.91, "r_y1": 90.69, "r_x2": 241.91, "r_y2": 85.73, "r_x3": 226.7, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.94, "r_y0": 91.05, "r_x1": 282.49, "r_y1": 91.05, "r_x2": 282.49, "r_y2": 86.09, "r_x3": 249.94, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19, "r_y0": 146.23, "r_x1": 444.69, "r_y1": 146.23, "r_x2": 444.69, "r_y2": 141.28, "r_x3": 410.19, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 90.69, "r_x1": 432.67, "r_y1": 90.69, "r_x2": 432.67, "r_y2": 85.73, "r_x3": 391.37, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61, "r_y0": 91.22, "r_x1": 445.62, "r_y1": 91.22, "r_x2": 445.62, "r_y2": 86.26, "r_x3": 435.61, "r_y3": 86.26, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.95, "r_y0": 146.25, "r_x1": 136.2, "r_y1": 146.25, "r_x2": 136.2, "r_y2": 141.29, "r_x3": 113.95, "r_y3": 141.29, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.92, "r_y0": 99.78, "r_x1": 127.05, "r_y1": 99.78, "r_x2": 127.05, "r_y2": 94.82, "r_x3": 116.92, "r_y3": 94.82, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.31, "r_y0": 105.9, "r_x1": 127.05, "r_y1": 105.9, "r_x2": 127.05, "r_y2": 100.94, "r_x3": 113.31, "r_y3": 100.94, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94, "r_y0": 112.02, "r_x1": 127.06, "r_y1": 112.02, "r_x2": 127.06, "r_y2": 107.06, "r_x3": 112.94, "r_y3": 107.06, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.23, "r_y0": 127.57, "r_x1": 126.97, "r_y1": 127.57, "r_x2": 126.97, "r_y2": 122.62, "r_x3": 113.23, "r_y3": 122.62, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85, "r_y0": 133.69, "r_x1": 126.97, "r_y1": 133.69, "r_x2": 126.97, "r_y2": 128.74, "r_x3": 112.85, "r_y3": 128.74, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.58, "r_y0": 146.39, "r_x1": 156.04, "r_y1": 146.39, "r_x2": 156.04, "r_y2": 141.44, "r_x3": 138.58, "r_y3": 141.44, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03, "r_y0": 91.23, "r_x1": 151.04, "r_y1": 91.23, "r_x2": 151.04, "r_y2": 86.27, "r_x3": 122.03, "r_y3": 86.27, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65, "r_y0": 91.51, "r_x1": 321.67, "r_y1": 91.51, "r_x2": 321.67, "r_y2": 86.55, "r_x3": 311.65, "r_y3": 86.55, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89, "r_y0": 146.67, "r_x1": 310.15, "r_y1": 146.67, "r_x2": 310.15, "r_y2": 141.71, "r_x3": 287.89, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.24, "r_y0": 98.04, "r_x1": 299.37, "r_y1": 98.04, "r_x2": 299.37, "r_y2": 93.08, "r_x3": 289.24, "r_y3": 93.08, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 104.16, "r_x1": 299.37, "r_y1": 104.16, "r_x2": 299.37, "r_y2": 99.2, "r_x3": 285.64, "r_y3": 99.2, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26, "r_y0": 110.28, "r_x1": 299.38, "r_y1": 110.28, "r_x2": 299.38, "r_y2": 105.32, "r_x3": 285.26, "r_y3": 105.32, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43, "r_y0": 125.35, "r_x1": 299.17, "r_y1": 125.35, "r_x2": 299.17, "r_y2": 120.39, "r_x3": 285.43, "r_y3": 120.39, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.06, "r_y0": 131.47, "r_x1": 299.17, "r_y1": 131.47, "r_x2": 299.17, "r_y2": 126.51, "r_x3": 285.06, "r_y3": 126.51, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.35, "r_y0": 146.67, "r_x1": 328.81, "r_y1": 146.67, "r_x2": 328.81, "r_y2": 141.71, "r_x3": 311.35, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58, "r_y0": 91.65, "r_x1": 309.6, "r_y1": 91.65, "r_x2": 309.6, "r_y2": 86.69, "r_x3": 299.58, "r_y3": 86.69, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04, "r_y0": 146.63, "r_x1": 483.5, "r_y1": 146.63, "r_x2": 483.5, "r_y2": 141.67, "r_x3": 466.04, "r_y3": 141.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02, "r_y0": 98.72, "r_x1": 469.16, "r_y1": 98.72, "r_x2": 469.16, "r_y2": 93.76, "r_x3": 459.02, "r_y3": 93.76, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.42, "r_y0": 104.84, "r_x1": 469.16, "r_y1": 104.84, "r_x2": 469.16, "r_y2": 99.88, "r_x3": 455.42, "r_y3": 99.88, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.05, "r_y0": 110.96, "r_x1": 469.16, "r_y1": 110.96, "r_x2": 469.16, "r_y2": 106.0, "r_x3": 455.05, "r_y3": 106.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39, "r_y0": 90.53, "r_x1": 480.65, "r_y1": 90.53, "r_x2": 480.65, "r_y2": 85.57, "r_x3": 467.39, "r_y3": 85.57, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.38, "r_y0": 146.54, "r_x1": 182.63, "r_y1": 146.54, "r_x2": 182.63, "r_y2": 141.58, "r_x3": 160.38, "r_y3": 141.58, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74, "r_y0": 99.82, "r_x1": 173.33, "r_y1": 99.82, "r_x2": 173.33, "r_y2": 94.86, "r_x3": 153.74, "r_y3": 94.86, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 105.94, "r_x1": 173.32, "r_y1": 105.94, "r_x2": 173.32, "r_y2": 100.98, "r_x3": 154.51, "r_y3": 100.98, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27, "r_y0": 112.06, "r_x1": 173.33, "r_y1": 112.06, "r_x2": 173.33, "r_y2": 107.1, "r_x3": 155.27, "r_y3": 107.1, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41, "r_y0": 112.19, "r_x1": 346.0, "r_y1": 112.19, "r_x2": 346.0, "r_y2": 107.23, "r_x3": 326.41, "r_y3": 107.23, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.18, "r_y0": 118.31, "r_x1": 345.99, "r_y1": 118.31, "r_x2": 345.99, "r_y2": 113.35, "r_x3": 327.18, "r_y3": 113.35, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94, "r_y0": 124.43, "r_x1": 346.0, "r_y1": 124.43, "r_x2": 346.0, "r_y2": 119.47, "r_x3": 327.94, "r_y3": 119.47, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.99, "r_y0": 109.11, "r_x1": 508.76, "r_y1": 109.11, "r_x2": 508.76, "r_y2": 104.15, "r_x3": 488.99, "r_y3": 104.15, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.19, "r_y0": 115.23, "r_x1": 508.76, "r_y1": 115.23, "r_x2": 508.76, "r_y2": 110.27, "r_x3": 490.19, "r_y3": 110.27, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72, "r_y0": 121.35, "r_x1": 508.77, "r_y1": 121.35, "r_x2": 508.77, "r_y2": 116.39, "r_x3": 489.72, "r_y3": 116.39, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71, "r_y0": 127.47, "r_x1": 508.77, "r_y1": 127.47, "r_x2": 508.77, "r_y2": 122.51, "r_x3": 490.71, "r_y3": 122.51, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.38, "r_y0": 146.67, "r_x1": 202.84, "r_y1": 146.67, "r_x2": 202.84, "r_y2": 141.71, "r_x3": 185.38, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.5, "r_y0": 91.09, "r_x1": 197.53, "r_y1": 91.09, "r_x2": 197.53, "r_y2": 86.14, "r_x3": 168.5, "r_y3": 86.14, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.38, "r_y0": 90.95, "r_x1": 367.4, "r_y1": 90.95, "r_x2": 367.4, "r_y2": 86.0, "r_x3": 357.38, "r_y3": 86.0, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73, "r_y0": 146.58, "r_x1": 374.93, "r_y1": 146.58, "r_x2": 374.93, "r_y2": 141.62, "r_x3": 333.73, "r_y3": 141.62, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69, "r_y0": 91.01, "r_x1": 355.71, "r_y1": 91.01, "r_x2": 355.71, "r_y2": 86.06, "r_x3": 345.69, "r_y3": 86.06, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54, "r_y0": 146.33, "r_x1": 526.01, "r_y1": 146.33, "r_x2": 526.01, "r_y2": 141.38, "r_x3": 508.54, "r_y3": 141.38, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.45, "r_y0": 91.05, "r_x1": 523.71, "r_y1": 91.05, "r_x2": 523.71, "r_y2": 86.09, "r_x3": 510.45, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 174.41, "r_x1": 545.11, "r_y1": 174.41, "r_x2": 545.11, "r_y2": 165.5, "r_x3": 50.11, "r_y3": 165.5, "coord_origin": "TOPLEFT" }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 186.36, "r_x1": 513.52, "r_y1": 186.36, "r_x2": 513.52, "r_y2": 177.46, "r_x3": 50.11, "r_y3": 177.46, "coord_origin": "TOPLEFT" }, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 219.84, "r_x1": 71.15, "r_y1": 219.84, "r_x2": 71.15, "r_y2": 210.93, "r_x3": 61.57, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.54, "r_y0": 219.84, "r_x1": 286.37, "r_y1": 219.84, "r_x2": 286.37, "r_y2": 210.93, "r_x3": 73.54, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 231.79, "r_x1": 87.47, "r_y1": 231.79, "r_x2": 87.47, "r_y2": 222.89, "r_x3": 70.04, "r_y3": 222.89, "coord_origin": "TOPLEFT" }, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 252.98, "r_x1": 71.35, "r_y1": 252.98, "r_x2": 71.35, "r_y2": 244.07, "r_x3": 61.57, "r_y3": 244.07, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.79, "r_y0": 252.98, "r_x1": 286.37, "r_y1": 252.98, "r_x2": 286.37, "r_y2": 244.07, "r_x3": 73.79, "r_y3": 244.07, "coord_origin": "TOPLEFT" }, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 264.93, "r_x1": 150.42, "r_y1": 264.93, "r_x2": 150.42, "r_y2": 256.03, "r_x3": 70.04, "r_y3": 256.03, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 288.11, "r_x1": 286.36, "r_y1": 288.11, "r_x2": 286.36, "r_y2": 279.2, "r_x3": 62.07, "r_y3": 279.2, "coord_origin": "TOPLEFT" }, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.06, "r_x1": 286.37, "r_y1": 300.06, "r_x2": 286.37, "r_y2": 291.16, "r_x3": 50.11, "r_y3": 291.16, "coord_origin": "TOPLEFT" }, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.02, "r_x1": 286.37, "r_y1": 312.02, "r_x2": 286.37, "r_y2": 303.11, "r_x3": 50.11, "r_y3": 303.11, "coord_origin": "TOPLEFT" }, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 323.97, "r_x1": 286.37, "r_y1": 323.97, "r_x2": 286.37, "r_y2": 315.07, "r_x3": 50.11, "r_y3": 315.07, "coord_origin": "TOPLEFT" }, "text": "More specifically, PDF documents can be seen as a se-", "orig": "More specifically, PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 335.93, "r_x1": 286.37, "r_y1": 335.93, "r_x2": 286.37, "r_y2": 327.02, "r_x3": 50.11, "r_y3": 327.02, "coord_origin": "TOPLEFT" }, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 347.89, "r_x1": 286.37, "r_y1": 347.89, "r_x2": 286.37, "r_y2": 338.98, "r_x3": 50.11, "r_y3": 338.98, "coord_origin": "TOPLEFT" }, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.84, "r_x1": 286.37, "r_y1": 359.84, "r_x2": 286.37, "r_y2": 350.93, "r_x3": 50.11, "r_y3": 350.93, "coord_origin": "TOPLEFT" }, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.8, "r_x1": 286.37, "r_y1": 371.8, "r_x2": 286.37, "r_y2": 362.89, "r_x3": 50.11, "r_y3": 362.89, "coord_origin": "TOPLEFT" }, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 383.75, "r_x1": 286.37, "r_y1": 383.75, "r_x2": 286.37, "r_y2": 374.84, "r_x3": 50.11, "r_y3": 374.84, "coord_origin": "TOPLEFT" }, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 395.71, "r_x1": 154.56, "r_y1": 395.71, "r_x2": 154.56, "r_y2": 386.8, "r_x3": 50.11, "r_y3": 386.8, "coord_origin": "TOPLEFT" }, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 407.98, "r_x1": 286.36, "r_y1": 407.98, "r_x2": 286.36, "r_y2": 399.07, "r_x3": 62.07, "r_y3": 399.07, "coord_origin": "TOPLEFT" }, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 419.93, "r_x1": 95.49, "r_y1": 419.93, "r_x2": 95.49, "r_y2": 411.03, "r_x3": 50.11, "r_y3": 411.03, "coord_origin": "TOPLEFT" }, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 432.2, "r_x1": 69.37, "r_y1": 432.2, "r_x2": 69.37, "r_y2": 423.3, "r_x3": 62.07, "r_y3": 423.3, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.81, "r_y0": 432.2, "r_x1": 286.37, "r_y1": 432.2, "r_x2": 286.37, "r_y2": 423.3, "r_x3": 71.81, "r_y3": 423.3, "coord_origin": "TOPLEFT" }, "text": "Get the minimal grid dimensions - number of rows and", "orig": "Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 444.16, "r_x1": 286.37, "r_y1": 444.16, "r_x2": 286.37, "r_y2": 435.25, "r_x3": 50.11, "r_y3": 435.25, "coord_origin": "TOPLEFT" }, "text": "columns for the predicted table structure. This represents", "orig": "columns for the predicted table structure. This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 456.11, "r_x1": 274.51, "r_y1": 456.11, "r_x2": 274.51, "r_y2": 447.21, "r_x3": 50.11, "r_y3": 447.21, "coord_origin": "TOPLEFT" }, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 468.38, "r_x1": 69.54, "r_y1": 468.38, "r_x2": 69.54, "r_y2": 459.48, "r_x3": 62.07, "r_y3": 459.48, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 77.43, "r_y0": 468.38, "r_x1": 286.36, "r_y1": 468.38, "r_x2": 286.36, "r_y2": 459.48, "r_x3": 77.43, "r_y3": 459.48, "coord_origin": "TOPLEFT" }, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 480.34, "r_x1": 286.37, "r_y1": 480.34, "r_x2": 286.37, "r_y2": 471.43, "r_x3": 50.11, "r_y3": 471.43, "coord_origin": "TOPLEFT" }, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 492.29, "r_x1": 286.37, "r_y1": 492.29, "r_x2": 286.37, "r_y2": 483.39, "r_x3": 50.11, "r_y3": 483.39, "coord_origin": "TOPLEFT" }, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 504.25, "r_x1": 110.7, "r_y1": 504.25, "r_x2": 110.7, "r_y2": 495.34, "r_x3": 50.11, "r_y3": 495.34, "coord_origin": "TOPLEFT" }, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 516.52, "r_x1": 69.86, "r_y1": 516.52, "r_x2": 69.86, "r_y2": 507.61, "r_x3": 62.07, "r_y3": 507.61, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.46, "r_y0": 516.52, "r_x1": 286.36, "r_y1": 516.52, "r_x2": 286.36, "r_y2": 507.61, "r_x3": 72.46, "r_y3": 507.61, "coord_origin": "TOPLEFT" }, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 528.47, "r_x1": 226.07, "r_y1": 528.47, "r_x2": 226.07, "r_y2": 519.57, "r_x3": 50.11, "r_y3": 519.57, "coord_origin": "TOPLEFT" }, "text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 540.74, "r_x1": 286.36, "r_y1": 540.74, "r_x2": 286.36, "r_y2": 531.84, "r_x3": 62.07, "r_y3": 531.84, "coord_origin": "TOPLEFT" }, "text": "3.a. If all IOU scores in a column are below the thresh-", "orig": "3.a. If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 552.7, "r_x1": 286.37, "r_y1": 552.7, "r_x2": 286.37, "r_y2": 543.79, "r_x3": 50.11, "r_y3": 543.79, "coord_origin": "TOPLEFT" }, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 564.65, "r_x1": 114.03, "r_y1": 564.65, "r_x2": 114.03, "r_y2": 555.75, "r_x3": 50.11, "r_y3": 555.75, "coord_origin": "TOPLEFT" }, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 576.92, "r_x1": 69.54, "r_y1": 576.92, "r_x2": 69.54, "r_y2": 568.02, "r_x3": 62.07, "r_y3": 568.02, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.73, "r_y0": 576.92, "r_x1": 286.37, "r_y1": 576.92, "r_x2": 286.37, "r_y2": 568.02, "r_x3": 76.73, "r_y3": 568.02, "coord_origin": "TOPLEFT" }, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 588.88, "r_x1": 286.37, "r_y1": 588.88, "r_x2": 286.37, "r_y2": 579.97, "r_x3": 50.11, "r_y3": 579.97, "coord_origin": "TOPLEFT" }, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 600.83, "r_x1": 278.7, "r_y1": 600.83, "r_x2": 278.7, "r_y2": 591.93, "r_x3": 50.11, "r_y3": 591.93, "coord_origin": "TOPLEFT" }, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.03, "r_y0": 632.84, "r_x1": 157.95, "r_y1": 632.84, "r_x2": 157.95, "r_y2": 623.99, "r_x3": 112.03, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.72, "r_y0": 632.84, "r_x1": 203.5, "r_y1": 632.84, "r_x2": 203.5, "r_y2": 623.99, "r_x3": 160.72, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58, "r_y0": 640.18, "r_x1": 189.15, "r_y1": 640.18, "r_x2": 189.15, "r_y2": 633.98, "r_x3": 185.58, "r_y3": 633.98, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 203.5, "r_y0": 632.84, "r_x1": 208.48, "r_y1": 632.84, "r_x2": 208.48, "r_y2": 623.44, "r_x3": 203.5, "r_y3": 623.44, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.48, "r_y0": 632.84, "r_x1": 220.29, "r_y1": 632.84, "r_x2": 220.29, "r_y2": 623.99, "r_x3": 208.48, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.79, "r_y0": 632.84, "r_x1": 225.77, "r_y1": 632.84, "r_x2": 225.77, "r_y2": 623.44, "r_x3": 220.79, "r_y3": 623.44, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.7, "r_y0": 654.11, "r_x1": 122.51, "r_y1": 654.11, "r_x2": 122.51, "r_y2": 645.26, "r_x3": 110.7, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.78, "r_y0": 654.11, "r_x1": 133.53, "r_y1": 654.11, "r_x2": 133.53, "r_y2": 645.26, "r_x3": 125.78, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 136.29, "r_y0": 654.11, "r_x1": 156.0, "r_y1": 654.11, "r_x2": 156.0, "r_y2": 645.26, "r_x3": 136.29, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "max", "orig": "max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.0, "r_y0": 654.11, "r_x1": 160.98, "r_y1": 654.11, "r_x2": 160.98, "r_y2": 644.7, "r_x3": 156.0, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.98, "r_y0": 654.11, "r_x1": 170.24, "r_y1": 654.11, "r_x2": 170.24, "r_y2": 645.26, "r_x3": 160.98, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.74, "r_y0": 654.11, "r_x1": 185.68, "r_y1": 654.11, "r_x2": 185.68, "r_y2": 644.7, "r_x3": 170.74, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "} \u2212", "orig": "} \u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.89, "r_y0": 654.11, "r_x1": 206.05, "r_y1": 654.11, "r_x2": 206.05, "r_y2": 645.26, "r_x3": 187.89, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "min", "orig": "min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.05, "r_y0": 654.11, "r_x1": 211.04, "r_y1": 654.11, "r_x2": 211.04, "r_y2": 644.7, "r_x3": 206.05, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.03, "r_y0": 654.11, "r_x1": 220.29, "r_y1": 654.11, "r_x2": 220.29, "r_y2": 645.26, "r_x3": 211.03, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.79, "r_y0": 654.11, "r_x1": 225.77, "r_y1": 654.11, "r_x2": 225.77, "r_y2": 644.7, "r_x3": 220.79, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 643.79, "r_x1": 286.36, "r_y1": 643.79, "r_x2": 286.36, "r_y2": 634.89, "r_x3": 274.75, "r_y3": 634.89, "coord_origin": "TOPLEFT" }, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 676.97, "r_x1": 74.45, "r_y1": 676.97, "r_x2": 74.45, "r_y2": 668.07, "r_x3": 50.11, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.34, "r_y0": 676.75, "r_x1": 82.65, "r_y1": 676.75, "r_x2": 82.65, "r_y2": 667.91, "r_x3": 78.34, "r_y3": 667.91, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.53, "r_y0": 676.97, "r_x1": 123.63, "r_y1": 676.97, "r_x2": 123.63, "r_y2": 668.07, "r_x3": 86.53, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "is one of", "orig": "is one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 127.52, "r_y0": 676.75, "r_x1": 132.5, "r_y1": 676.75, "r_x2": 132.5, "r_y2": 667.35, "r_x3": 127.52, "r_y3": 667.35, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.5, "r_y0": 676.97, "r_x1": 210.7, "r_y1": 676.97, "r_x2": 210.7, "r_y2": 668.07, "r_x3": 132.5, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "left, centroid, right", "orig": "left, centroid, right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.7, "r_y0": 676.75, "r_x1": 215.68, "r_y1": 676.75, "r_x2": 215.68, "r_y2": 667.35, "r_x3": 210.7, "r_y3": 667.35, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.56, "r_y0": 676.97, "r_x1": 233.95, "r_y1": 676.97, "r_x2": 233.95, "r_y2": 668.07, "r_x3": 219.56, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 237.83, "r_y0": 676.75, "r_x1": 247.09, "r_y1": 676.75, "r_x2": 247.09, "r_y2": 667.91, "r_x3": 237.83, "r_y3": 667.91, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.47, "r_y0": 676.97, "r_x1": 286.36, "r_y1": 676.97, "r_x2": 286.36, "r_y2": 668.07, "r_x3": 251.47, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "is the x-", "orig": "is the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 688.93, "r_x1": 205.89, "r_y1": 688.93, "r_x2": 205.89, "r_y2": 680.02, "r_x3": 50.11, "r_y3": 680.02, "coord_origin": "TOPLEFT" }, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 701.2, "r_x1": 69.54, "r_y1": 701.2, "r_x2": 69.54, "r_y2": 692.29, "r_x3": 62.07, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.27, "r_y0": 701.2, "r_x1": 286.36, "r_y1": 701.2, "r_x2": 286.36, "r_y2": 692.29, "r_x3": 76.27, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 94.6, "r_y1": 713.15, "r_x2": 94.6, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.6, "r_y0": 712.93, "r_x1": 103.29, "r_y1": 712.93, "r_x2": 103.29, "r_y2": 704.09, "r_x3": 97.6, "r_y3": 704.09, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.29, "r_y0": 713.15, "r_x1": 286.36, "r_y1": 713.15, "r_x2": 286.36, "r_y2": 704.25, "r_x3": 103.29, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 219.84, "r_x1": 545.12, "r_y1": 219.84, "r_x2": 545.12, "r_y2": 210.93, "r_x3": 308.86, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "dian cell size for all table cells. The usage of median dur-", "orig": "dian cell size for all table cells. The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 231.79, "r_x1": 545.12, "r_y1": 231.79, "r_x2": 545.12, "r_y2": 222.89, "r_x3": 308.86, "r_y3": 222.89, "coord_origin": "TOPLEFT" }, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 243.75, "r_x1": 545.12, "r_y1": 243.75, "r_x2": 545.12, "r_y2": 234.84, "r_x3": 308.86, "r_y3": 234.84, "coord_origin": "TOPLEFT" }, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 255.7, "r_x1": 339.58, "r_y1": 255.7, "r_x2": 339.58, "r_y2": 246.8, "r_x3": 308.86, "r_y3": 246.8, "coord_origin": "TOPLEFT" }, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 268.01, "r_x1": 328.29, "r_y1": 268.01, "r_x2": 328.29, "r_y2": 259.1, "r_x3": 320.82, "r_y3": 259.1, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.88, "r_y0": 268.01, "r_x1": 545.11, "r_y1": 268.01, "r_x2": 545.11, "r_y2": 259.1, "r_x3": 334.88, "r_y3": 259.1, "coord_origin": "TOPLEFT" }, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 279.96, "r_x1": 338.19, "r_y1": 279.96, "r_x2": 338.19, "r_y2": 271.06, "r_x3": 308.86, "r_y3": 271.06, "coord_origin": "TOPLEFT" }, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.68, "r_y0": 279.74, "r_x1": 346.38, "r_y1": 279.74, "r_x2": 346.38, "r_y2": 270.9, "r_x3": 340.68, "r_y3": 270.9, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.38, "r_y0": 279.96, "r_x1": 453.72, "r_y1": 279.96, "r_x2": 453.72, "r_y2": 271.06, "r_x3": 346.38, "r_y3": 271.06, "coord_origin": "TOPLEFT" }, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 292.27, "r_x1": 328.39, "r_y1": 292.27, "r_x2": 328.39, "r_y2": 283.36, "r_x3": 320.82, "r_y3": 283.36, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.91, "r_y0": 292.27, "r_x1": 545.11, "r_y1": 292.27, "r_x2": 545.11, "r_y2": 283.36, "r_x3": 330.91, "r_y3": 283.36, "coord_origin": "TOPLEFT" }, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.22, "r_x1": 545.12, "r_y1": 304.22, "r_x2": 545.12, "r_y2": 295.32, "r_x3": 308.86, "r_y3": 295.32, "coord_origin": "TOPLEFT" }, "text": "corrected bounding boxes and PDF cells. This time use a", "orig": "corrected bounding boxes and PDF cells. This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.18, "r_x1": 545.12, "r_y1": 316.18, "r_x2": 545.12, "r_y2": 307.27, "r_x3": 308.86, "r_y3": 307.27, "coord_origin": "TOPLEFT" }, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 328.13, "r_x1": 545.12, "r_y1": 328.13, "r_x2": 545.12, "r_y2": 319.23, "r_x3": 308.86, "r_y3": 319.23, "coord_origin": "TOPLEFT" }, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 340.09, "r_x1": 397.19, "r_y1": 340.09, "r_x2": 397.19, "r_y2": 331.18, "r_x3": 308.86, "r_y3": 331.18, "coord_origin": "TOPLEFT" }, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.66, "r_y0": 340.09, "r_x1": 545.12, "r_y1": 340.09, "r_x2": 545.12, "r_y2": 331.18, "r_x3": 403.66, "r_y3": 331.18, "coord_origin": "TOPLEFT" }, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 352.05, "r_x1": 545.12, "r_y1": 352.05, "r_x2": 545.12, "r_y2": 343.14, "r_x3": 308.86, "r_y3": 343.14, "coord_origin": "TOPLEFT" }, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 364.0, "r_x1": 545.12, "r_y1": 364.0, "r_x2": 545.12, "r_y2": 355.09, "r_x3": 308.86, "r_y3": 355.09, "coord_origin": "TOPLEFT" }, "text": "is preferred. This covers the cases where the PDF cells are", "orig": "is preferred. This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 375.96, "r_x1": 545.12, "r_y1": 375.96, "r_x2": 545.12, "r_y2": 367.05, "r_x3": 308.86, "r_y3": 367.05, "coord_origin": "TOPLEFT" }, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 387.91, "r_x1": 329.61, "r_y1": 387.91, "r_x2": 329.61, "r_y2": 379.0, "r_x3": 308.86, "r_y3": 379.0, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 400.22, "r_x1": 328.55, "r_y1": 400.22, "r_x2": 328.55, "r_y2": 391.31, "r_x3": 320.82, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.13, "r_y0": 400.22, "r_x1": 545.12, "r_y1": 400.22, "r_x2": 545.12, "r_y2": 391.31, "r_x3": 331.13, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.17, "r_x1": 545.12, "r_y1": 412.17, "r_x2": 545.12, "r_y2": 403.27, "r_x3": 308.86, "r_y3": 403.27, "coord_origin": "TOPLEFT" }, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.13, "r_x1": 545.12, "r_y1": 424.13, "r_x2": 545.12, "r_y2": 415.22, "r_x3": 308.86, "r_y3": 415.22, "coord_origin": "TOPLEFT" }, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.08, "r_x1": 545.12, "r_y1": 436.08, "r_x2": 545.12, "r_y2": 427.18, "r_x3": 308.86, "r_y3": 427.18, "coord_origin": "TOPLEFT" }, "text": "columns pointing to the same PDF column. In such case", "orig": "columns pointing to the same PDF column. In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.04, "r_x1": 545.12, "r_y1": 448.04, "r_x2": 545.12, "r_y2": 439.13, "r_x3": 308.86, "r_y3": 439.13, "coord_origin": "TOPLEFT" }, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 459.99, "r_x1": 426.18, "r_y1": 459.99, "r_x2": 426.18, "r_y2": 451.09, "r_x3": 308.86, "r_y3": 451.09, "coord_origin": "TOPLEFT" }, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 472.3, "r_x1": 328.67, "r_y1": 472.3, "r_x2": 328.67, "r_y2": 463.39, "r_x3": 320.82, "r_y3": 463.39, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.29, "r_y0": 472.3, "r_x1": 545.11, "r_y1": 472.3, "r_x2": 545.11, "r_y2": 463.39, "r_x3": 331.29, "r_y3": 463.39, "coord_origin": "TOPLEFT" }, "text": "Pick up the remaining orphan cells. There could be", "orig": "Pick up the remaining orphan cells. There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 484.25, "r_x1": 545.12, "r_y1": 484.25, "r_x2": 545.12, "r_y2": 475.35, "r_x3": 308.86, "r_y3": 475.35, "coord_origin": "TOPLEFT" }, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 496.21, "r_x1": 545.12, "r_y1": 496.21, "r_x2": 545.12, "r_y2": 487.3, "r_x3": 308.86, "r_y3": 487.3, "coord_origin": "TOPLEFT" }, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 508.16, "r_x1": 381.9, "r_y1": 508.16, "r_x2": 381.9, "r_y2": 499.26, "r_x3": 308.86, "r_y3": 499.26, "coord_origin": "TOPLEFT" }, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 508.16, "r_x1": 545.12, "r_y1": 508.16, "r_x2": 545.12, "r_y2": 499.26, "r_x3": 388.7, "r_y3": 499.26, "coord_origin": "TOPLEFT" }, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 520.12, "r_x1": 545.12, "r_y1": 520.12, "r_x2": 545.12, "r_y2": 511.21, "r_x3": 308.86, "r_y3": 511.21, "coord_origin": "TOPLEFT" }, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 532.07, "r_x1": 545.12, "r_y1": 532.07, "r_x2": 545.12, "r_y2": 523.17, "r_x3": 308.86, "r_y3": 523.17, "coord_origin": "TOPLEFT" }, "text": "bounding box on the geometry of the grid. This mapping", "orig": "bounding box on the geometry of the grid. This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 544.03, "r_x1": 545.11, "r_y1": 544.03, "r_x2": 545.11, "r_y2": 535.12, "r_x3": 308.86, "r_y3": 535.12, "coord_origin": "TOPLEFT" }, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 555.98, "r_x1": 545.12, "r_y1": 555.98, "r_x2": 545.12, "r_y2": 547.08, "r_x3": 308.86, "r_y3": 547.08, "coord_origin": "TOPLEFT" }, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 567.94, "r_x1": 442.22, "r_y1": 567.94, "r_x2": 442.22, "r_y2": 559.03, "r_x3": 308.86, "r_y3": 559.03, "coord_origin": "TOPLEFT" }, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 580.24, "r_x1": 545.11, "r_y1": 580.24, "r_x2": 545.11, "r_y2": 571.34, "r_x3": 320.82, "r_y3": 571.34, "coord_origin": "TOPLEFT" }, "text": "9a. Compute the top and bottom boundary of the hori-", "orig": "9a. Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 592.2, "r_x1": 471.64, "r_y1": 592.2, "r_x2": 471.64, "r_y2": 583.29, "r_x3": 308.86, "r_y3": 583.29, "coord_origin": "TOPLEFT" }, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.83, "r_y0": 591.98, "r_x1": 479.72, "r_y1": 591.98, "r_x2": 479.72, "r_y2": 583.13, "r_x3": 474.83, "r_y3": 583.13, "coord_origin": "TOPLEFT" }, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.27, "r_y0": 592.2, "r_x1": 545.12, "r_y1": 592.2, "r_x2": 545.12, "r_y2": 583.29, "r_x3": 483.27, "r_y3": 583.29, "coord_origin": "TOPLEFT" }, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 604.15, "r_x1": 329.91, "r_y1": 604.15, "r_x2": 329.91, "r_y2": 595.25, "r_x3": 308.86, "r_y3": 595.25, "coord_origin": "TOPLEFT" }, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 616.46, "r_x1": 332.87, "r_y1": 616.46, "r_x2": 332.87, "r_y2": 607.55, "r_x3": 320.82, "r_y3": 607.55, "coord_origin": "TOPLEFT" }, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93, "r_y0": 616.46, "r_x1": 545.12, "r_y1": 616.46, "r_x2": 545.12, "r_y2": 607.55, "r_x3": 339.93, "r_y3": 607.55, "coord_origin": "TOPLEFT" }, "text": "Intersect the orphan\u2019s bounding box with the row", "orig": "Intersect the orphan\u2019s bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 628.42, "r_x1": 495.29, "r_y1": 628.42, "r_x2": 495.29, "r_y2": 619.51, "r_x3": 308.86, "r_y3": 619.51, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 640.72, "r_x1": 545.12, "r_y1": 640.72, "r_x2": 545.12, "r_y2": 631.81, "r_x3": 320.82, "r_y3": 631.81, "coord_origin": "TOPLEFT" }, "text": "9c. Compute the left and right boundary of the vertical", "orig": "9c. Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 652.68, "r_x1": 455.28, "r_y1": 652.68, "r_x2": 455.28, "r_y2": 643.77, "r_x3": 308.86, "r_y3": 643.77, "coord_origin": "TOPLEFT" }, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 457.78, "r_y0": 652.46, "r_x1": 463.47, "r_y1": 652.46, "r_x2": 463.47, "r_y2": 643.61, "r_x3": 457.78, "r_y3": 643.61, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.97, "r_y0": 652.68, "r_x1": 545.11, "r_y1": 652.68, "r_x2": 545.11, "r_y2": 643.77, "r_x3": 465.97, "r_y3": 643.77, "coord_origin": "TOPLEFT" }, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 664.63, "r_x1": 332.38, "r_y1": 664.63, "r_x2": 332.38, "r_y2": 655.72, "r_x3": 308.86, "r_y3": 655.72, "coord_origin": "TOPLEFT" }, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 676.94, "r_x1": 545.11, "r_y1": 676.94, "r_x2": 545.11, "r_y2": 668.03, "r_x3": 320.82, "r_y3": 668.03, "coord_origin": "TOPLEFT" }, "text": "9d. Intersect the orphan\u2019s bounding box with the column", "orig": "9d. Intersect the orphan\u2019s bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 688.89, "r_x1": 510.58, "r_y1": 688.89, "r_x2": 510.58, "r_y2": 679.99, "r_x3": 308.86, "r_y3": 679.99, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 320.82, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 30, "label": "picture", "bbox": { "l": 53.54, "t": 74.75, "r": 544.94, "b": 147.59, "coord_origin": "TOPLEFT" }, "confidence": 0.603, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39, "r_y0": 83.26, "r_x1": 151.95, "r_y1": 83.26, "r_x2": 151.95, "r_y2": 77.31, "r_x3": 119.39, "r_y3": 77.31, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.35, "r_y0": 81.14, "r_x1": 59.33, "r_y1": 81.14, "r_x2": 59.33, "r_y2": 75.19, "r_x3": 53.35, "r_y3": 75.19, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.58, "r_y0": 83.41, "r_x1": 319.83, "r_y1": 83.41, "r_x2": 319.83, "r_y2": 77.46, "r_x3": 289.58, "r_y3": 77.46, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37, "r_y0": 83.2, "r_x1": 481.76, "r_y1": 83.2, "r_x2": 481.76, "r_y2": 77.25, "r_x3": 448.37, "r_y3": 77.25, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.55, "r_y0": 146.23, "r_x1": 94.98, "r_y1": 146.23, "r_x2": 94.98, "r_y2": 141.28, "r_x3": 82.55, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.04, "r_y0": 106.06, "r_x1": 85.29, "r_y1": 106.06, "r_x2": 85.29, "r_y2": 101.1, "r_x3": 63.04, "r_y3": 101.1, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 129.35, "r_x1": 85.23, "r_y1": 129.35, "r_x2": 85.23, "r_y2": 124.4, "r_x3": 67.77, "r_y3": 124.4, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55, "r_y0": 107.5, "r_x1": 249.8, "r_y1": 107.5, "r_x2": 249.8, "r_y2": 102.54, "r_x3": 227.55, "r_y3": 102.54, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.2, "r_y0": 131.94, "r_x1": 249.66, "r_y1": 131.94, "r_x2": 249.66, "r_y2": 126.99, "r_x3": 232.2, "r_y3": 126.99, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.23, "r_y0": 119.0, "r_x1": 413.7, "r_y1": 119.0, "r_x2": 413.7, "r_y2": 114.05, "r_x3": 396.23, "r_y3": 114.05, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.38, "r_y0": 146.23, "r_x1": 105.08, "r_y1": 146.23, "r_x2": 105.08, "r_y2": 141.28, "r_x3": 97.38, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.94, "r_y0": 90.69, "r_x1": 76.15, "r_y1": 90.69, "r_x2": 76.15, "r_y2": 85.73, "r_x3": 60.94, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.3, "r_y0": 91.18, "r_x1": 106.99, "r_y1": 91.18, "r_x2": 106.99, "r_y2": 86.22, "r_x3": 82.3, "r_y3": 86.22, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.21, "r_y0": 146.56, "r_x1": 281.88, "r_y1": 146.56, "r_x2": 281.88, "r_y2": 141.61, "r_x3": 246.21, "r_y3": 141.61, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.7, "r_y0": 90.69, "r_x1": 241.91, "r_y1": 90.69, "r_x2": 241.91, "r_y2": 85.73, "r_x3": 226.7, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.94, "r_y0": 91.05, "r_x1": 282.49, "r_y1": 91.05, "r_x2": 282.49, "r_y2": 86.09, "r_x3": 249.94, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19, "r_y0": 146.23, "r_x1": 444.69, "r_y1": 146.23, "r_x2": 444.69, "r_y2": 141.28, "r_x3": 410.19, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 90.69, "r_x1": 432.67, "r_y1": 90.69, "r_x2": 432.67, "r_y2": 85.73, "r_x3": 391.37, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61, "r_y0": 91.22, "r_x1": 445.62, "r_y1": 91.22, "r_x2": 445.62, "r_y2": 86.26, "r_x3": 435.61, "r_y3": 86.26, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.95, "r_y0": 146.25, "r_x1": 136.2, "r_y1": 146.25, "r_x2": 136.2, "r_y2": 141.29, "r_x3": 113.95, "r_y3": 141.29, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.92, "r_y0": 99.78, "r_x1": 127.05, "r_y1": 99.78, "r_x2": 127.05, "r_y2": 94.82, "r_x3": 116.92, "r_y3": 94.82, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.31, "r_y0": 105.9, "r_x1": 127.05, "r_y1": 105.9, "r_x2": 127.05, "r_y2": 100.94, "r_x3": 113.31, "r_y3": 100.94, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94, "r_y0": 112.02, "r_x1": 127.06, "r_y1": 112.02, "r_x2": 127.06, "r_y2": 107.06, "r_x3": 112.94, "r_y3": 107.06, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.23, "r_y0": 127.57, "r_x1": 126.97, "r_y1": 127.57, "r_x2": 126.97, "r_y2": 122.62, "r_x3": 113.23, "r_y3": 122.62, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85, "r_y0": 133.69, "r_x1": 126.97, "r_y1": 133.69, "r_x2": 126.97, "r_y2": 128.74, "r_x3": 112.85, "r_y3": 128.74, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.58, "r_y0": 146.39, "r_x1": 156.04, "r_y1": 146.39, "r_x2": 156.04, "r_y2": 141.44, "r_x3": 138.58, "r_y3": 141.44, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03, "r_y0": 91.23, "r_x1": 151.04, "r_y1": 91.23, "r_x2": 151.04, "r_y2": 86.27, "r_x3": 122.03, "r_y3": 86.27, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65, "r_y0": 91.51, "r_x1": 321.67, "r_y1": 91.51, "r_x2": 321.67, "r_y2": 86.55, "r_x3": 311.65, "r_y3": 86.55, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89, "r_y0": 146.67, "r_x1": 310.15, "r_y1": 146.67, "r_x2": 310.15, "r_y2": 141.71, "r_x3": 287.89, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.24, "r_y0": 98.04, "r_x1": 299.37, "r_y1": 98.04, "r_x2": 299.37, "r_y2": 93.08, "r_x3": 289.24, "r_y3": 93.08, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 104.16, "r_x1": 299.37, "r_y1": 104.16, "r_x2": 299.37, "r_y2": 99.2, "r_x3": 285.64, "r_y3": 99.2, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26, "r_y0": 110.28, "r_x1": 299.38, "r_y1": 110.28, "r_x2": 299.38, "r_y2": 105.32, "r_x3": 285.26, "r_y3": 105.32, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43, "r_y0": 125.35, "r_x1": 299.17, "r_y1": 125.35, "r_x2": 299.17, "r_y2": 120.39, "r_x3": 285.43, "r_y3": 120.39, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.06, "r_y0": 131.47, "r_x1": 299.17, "r_y1": 131.47, "r_x2": 299.17, "r_y2": 126.51, "r_x3": 285.06, "r_y3": 126.51, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.35, "r_y0": 146.67, "r_x1": 328.81, "r_y1": 146.67, "r_x2": 328.81, "r_y2": 141.71, "r_x3": 311.35, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58, "r_y0": 91.65, "r_x1": 309.6, "r_y1": 91.65, "r_x2": 309.6, "r_y2": 86.69, "r_x3": 299.58, "r_y3": 86.69, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04, "r_y0": 146.63, "r_x1": 483.5, "r_y1": 146.63, "r_x2": 483.5, "r_y2": 141.67, "r_x3": 466.04, "r_y3": 141.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02, "r_y0": 98.72, "r_x1": 469.16, "r_y1": 98.72, "r_x2": 469.16, "r_y2": 93.76, "r_x3": 459.02, "r_y3": 93.76, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.42, "r_y0": 104.84, "r_x1": 469.16, "r_y1": 104.84, "r_x2": 469.16, "r_y2": 99.88, "r_x3": 455.42, "r_y3": 99.88, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.05, "r_y0": 110.96, "r_x1": 469.16, "r_y1": 110.96, "r_x2": 469.16, "r_y2": 106.0, "r_x3": 455.05, "r_y3": 106.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39, "r_y0": 90.53, "r_x1": 480.65, "r_y1": 90.53, "r_x2": 480.65, "r_y2": 85.57, "r_x3": 467.39, "r_y3": 85.57, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.38, "r_y0": 146.54, "r_x1": 182.63, "r_y1": 146.54, "r_x2": 182.63, "r_y2": 141.58, "r_x3": 160.38, "r_y3": 141.58, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74, "r_y0": 99.82, "r_x1": 173.33, "r_y1": 99.82, "r_x2": 173.33, "r_y2": 94.86, "r_x3": 153.74, "r_y3": 94.86, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 105.94, "r_x1": 173.32, "r_y1": 105.94, "r_x2": 173.32, "r_y2": 100.98, "r_x3": 154.51, "r_y3": 100.98, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27, "r_y0": 112.06, "r_x1": 173.33, "r_y1": 112.06, "r_x2": 173.33, "r_y2": 107.1, "r_x3": 155.27, "r_y3": 107.1, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41, "r_y0": 112.19, "r_x1": 346.0, "r_y1": 112.19, "r_x2": 346.0, "r_y2": 107.23, "r_x3": 326.41, "r_y3": 107.23, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.18, "r_y0": 118.31, "r_x1": 345.99, "r_y1": 118.31, "r_x2": 345.99, "r_y2": 113.35, "r_x3": 327.18, "r_y3": 113.35, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94, "r_y0": 124.43, "r_x1": 346.0, "r_y1": 124.43, "r_x2": 346.0, "r_y2": 119.47, "r_x3": 327.94, "r_y3": 119.47, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.99, "r_y0": 109.11, "r_x1": 508.76, "r_y1": 109.11, "r_x2": 508.76, "r_y2": 104.15, "r_x3": 488.99, "r_y3": 104.15, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.19, "r_y0": 115.23, "r_x1": 508.76, "r_y1": 115.23, "r_x2": 508.76, "r_y2": 110.27, "r_x3": 490.19, "r_y3": 110.27, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72, "r_y0": 121.35, "r_x1": 508.77, "r_y1": 121.35, "r_x2": 508.77, "r_y2": 116.39, "r_x3": 489.72, "r_y3": 116.39, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71, "r_y0": 127.47, "r_x1": 508.77, "r_y1": 127.47, "r_x2": 508.77, "r_y2": 122.51, "r_x3": 490.71, "r_y3": 122.51, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.38, "r_y0": 146.67, "r_x1": 202.84, "r_y1": 146.67, "r_x2": 202.84, "r_y2": 141.71, "r_x3": 185.38, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.5, "r_y0": 91.09, "r_x1": 197.53, "r_y1": 91.09, "r_x2": 197.53, "r_y2": 86.14, "r_x3": 168.5, "r_y3": 86.14, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.38, "r_y0": 90.95, "r_x1": 367.4, "r_y1": 90.95, "r_x2": 367.4, "r_y2": 86.0, "r_x3": 357.38, "r_y3": 86.0, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73, "r_y0": 146.58, "r_x1": 374.93, "r_y1": 146.58, "r_x2": 374.93, "r_y2": 141.62, "r_x3": 333.73, "r_y3": 141.62, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69, "r_y0": 91.01, "r_x1": 355.71, "r_y1": 91.01, "r_x2": 355.71, "r_y2": 86.06, "r_x3": 345.69, "r_y3": 86.06, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54, "r_y0": 146.33, "r_x1": 526.01, "r_y1": 146.33, "r_x2": 526.01, "r_y2": 141.38, "r_x3": 508.54, "r_y3": 141.38, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.45, "r_y0": 91.05, "r_x1": 523.71, "r_y1": 91.05, "r_x2": 523.71, "r_y2": 86.09, "r_x3": 510.45, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 46, "label": "text", "bbox": { "l": 119.39, "t": 77.31, "r": 151.95, "b": 83.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39, "r_y0": 83.26, "r_x1": 151.95, "r_y1": 83.26, "r_x2": 151.95, "r_y2": 77.31, "r_x3": 119.39, "r_y3": 77.31, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 53.35, "t": 75.19, "r": 59.33, "b": 81.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.35, "r_y0": 81.14, "r_x1": 59.33, "r_y1": 81.14, "r_x2": 59.33, "r_y2": 75.19, "r_x3": 53.35, "r_y3": 75.19, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 289.58, "t": 77.46, "r": 319.83, "b": 83.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.58, "r_y0": 83.41, "r_x1": 319.83, "r_y1": 83.41, "r_x2": 319.83, "r_y2": 77.46, "r_x3": 289.58, "r_y3": 77.46, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 448.37, "t": 77.25, "r": 481.76, "b": 83.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37, "r_y0": 83.2, "r_x1": 481.76, "r_y1": 83.2, "r_x2": 481.76, "r_y2": 77.25, "r_x3": 448.37, "r_y3": 77.25, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 82.55, "t": 141.28, "r": 94.98, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.55, "r_y0": 146.23, "r_x1": 94.98, "r_y1": 146.23, "r_x2": 94.98, "r_y2": 141.28, "r_x3": 82.55, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 63.04, "t": 101.1, "r": 85.29, "b": 106.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.04, "r_y0": 106.06, "r_x1": 85.29, "r_y1": 106.06, "r_x2": 85.29, "r_y2": 101.1, "r_x3": 63.04, "r_y3": 101.1, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 67.77, "t": 124.4, "r": 85.23, "b": 129.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 129.35, "r_x1": 85.23, "r_y1": 129.35, "r_x2": 85.23, "r_y2": 124.4, "r_x3": 67.77, "r_y3": 124.4, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 227.55, "t": 102.54, "r": 249.8, "b": 107.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55, "r_y0": 107.5, "r_x1": 249.8, "r_y1": 107.5, "r_x2": 249.8, "r_y2": 102.54, "r_x3": 227.55, "r_y3": 102.54, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 232.2, "t": 126.99, "r": 249.66, "b": 131.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.2, "r_y0": 131.94, "r_x1": 249.66, "r_y1": 131.94, "r_x2": 249.66, "r_y2": 126.99, "r_x3": 232.2, "r_y3": 126.99, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 396.23, "t": 114.05, "r": 413.7, "b": 119.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.23, "r_y0": 119.0, "r_x1": 413.7, "r_y1": 119.0, "r_x2": 413.7, "r_y2": 114.05, "r_x3": 396.23, "r_y3": 114.05, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 97.38, "t": 141.28, "r": 105.08, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.38, "r_y0": 146.23, "r_x1": 105.08, "r_y1": 146.23, "r_x2": 105.08, "r_y2": 141.28, "r_x3": 97.38, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 60.94, "t": 85.73, "r": 76.15, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.94, "r_y0": 90.69, "r_x1": 76.15, "r_y1": 90.69, "r_x2": 76.15, "r_y2": 85.73, "r_x3": 60.94, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 82.3, "t": 86.22, "r": 106.99, "b": 91.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.3, "r_y0": 91.18, "r_x1": 106.99, "r_y1": 91.18, "r_x2": 106.99, "r_y2": 86.22, "r_x3": 82.3, "r_y3": 86.22, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 246.21, "t": 141.61, "r": 281.88, "b": 146.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.21, "r_y0": 146.56, "r_x1": 281.88, "r_y1": 146.56, "r_x2": 281.88, "r_y2": 141.61, "r_x3": 246.21, "r_y3": 141.61, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 226.7, "t": 85.73, "r": 241.91, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.7, "r_y0": 90.69, "r_x1": 241.91, "r_y1": 90.69, "r_x2": 241.91, "r_y2": 85.73, "r_x3": 226.7, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 249.94, "t": 86.09, "r": 282.49, "b": 91.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.94, "r_y0": 91.05, "r_x1": 282.49, "r_y1": 91.05, "r_x2": 282.49, "r_y2": 86.09, "r_x3": 249.94, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 410.19, "t": 141.28, "r": 444.69, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19, "r_y0": 146.23, "r_x1": 444.69, "r_y1": 146.23, "r_x2": 444.69, "r_y2": 141.28, "r_x3": 410.19, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 391.37, "t": 85.73, "r": 432.67, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 90.69, "r_x1": 432.67, "r_y1": 90.69, "r_x2": 432.67, "r_y2": 85.73, "r_x3": 391.37, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 435.61, "t": 86.26, "r": 445.62, "b": 91.22, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61, "r_y0": 91.22, "r_x1": 445.62, "r_y1": 91.22, "r_x2": 445.62, "r_y2": 86.26, "r_x3": 435.61, "r_y3": 86.26, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 113.95, "t": 141.29, "r": 136.2, "b": 146.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.95, "r_y0": 146.25, "r_x1": 136.2, "r_y1": 146.25, "r_x2": 136.2, "r_y2": 141.29, "r_x3": 113.95, "r_y3": 141.29, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 116.92, "t": 94.82, "r": 127.05, "b": 99.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.92, "r_y0": 99.78, "r_x1": 127.05, "r_y1": 99.78, "r_x2": 127.05, "r_y2": 94.82, "r_x3": 116.92, "r_y3": 94.82, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 113.31, "t": 100.94, "r": 127.05, "b": 105.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.31, "r_y0": 105.9, "r_x1": 127.05, "r_y1": 105.9, "r_x2": 127.05, "r_y2": 100.94, "r_x3": 113.31, "r_y3": 100.94, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 112.94, "t": 107.06, "r": 127.06, "b": 112.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94, "r_y0": 112.02, "r_x1": 127.06, "r_y1": 112.02, "r_x2": 127.06, "r_y2": 107.06, "r_x3": 112.94, "r_y3": 107.06, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 113.23, "t": 122.62, "r": 126.97, "b": 127.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.23, "r_y0": 127.57, "r_x1": 126.97, "r_y1": 127.57, "r_x2": 126.97, "r_y2": 122.62, "r_x3": 113.23, "r_y3": 122.62, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 112.85, "t": 128.74, "r": 126.97, "b": 133.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85, "r_y0": 133.69, "r_x1": 126.97, "r_y1": 133.69, "r_x2": 126.97, "r_y2": 128.74, "r_x3": 112.85, "r_y3": 128.74, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 138.58, "t": 141.44, "r": 156.04, "b": 146.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.58, "r_y0": 146.39, "r_x1": 156.04, "r_y1": 146.39, "r_x2": 156.04, "r_y2": 141.44, "r_x3": 138.58, "r_y3": 141.44, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 122.03, "t": 86.27, "r": 151.04, "b": 91.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03, "r_y0": 91.23, "r_x1": 151.04, "r_y1": 91.23, "r_x2": 151.04, "r_y2": 86.27, "r_x3": 122.03, "r_y3": 86.27, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 311.65, "t": 86.55, "r": 321.67, "b": 91.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65, "r_y0": 91.51, "r_x1": 321.67, "r_y1": 91.51, "r_x2": 321.67, "r_y2": 86.55, "r_x3": 311.65, "r_y3": 86.55, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 287.89, "t": 141.71, "r": 310.15, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89, "r_y0": 146.67, "r_x1": 310.15, "r_y1": 146.67, "r_x2": 310.15, "r_y2": 141.71, "r_x3": 287.89, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.24, "t": 93.08, "r": 299.37, "b": 98.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.24, "r_y0": 98.04, "r_x1": 299.37, "r_y1": 98.04, "r_x2": 299.37, "r_y2": 93.08, "r_x3": 289.24, "r_y3": 93.08, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 285.64, "t": 99.2, "r": 299.37, "b": 104.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 104.16, "r_x1": 299.37, "r_y1": 104.16, "r_x2": 299.37, "r_y2": 99.2, "r_x3": 285.64, "r_y3": 99.2, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 285.26, "t": 105.32, "r": 299.38, "b": 110.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26, "r_y0": 110.28, "r_x1": 299.38, "r_y1": 110.28, "r_x2": 299.38, "r_y2": 105.32, "r_x3": 285.26, "r_y3": 105.32, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 285.43, "t": 120.39, "r": 299.17, "b": 125.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43, "r_y0": 125.35, "r_x1": 299.17, "r_y1": 125.35, "r_x2": 299.17, "r_y2": 120.39, "r_x3": 285.43, "r_y3": 120.39, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 285.06, "t": 126.51, "r": 299.17, "b": 131.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.06, "r_y0": 131.47, "r_x1": 299.17, "r_y1": 131.47, "r_x2": 299.17, "r_y2": 126.51, "r_x3": 285.06, "r_y3": 126.51, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 311.35, "t": 141.71, "r": 328.81, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.35, "r_y0": 146.67, "r_x1": 328.81, "r_y1": 146.67, "r_x2": 328.81, "r_y2": 141.71, "r_x3": 311.35, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 299.58, "t": 86.69, "r": 309.6, "b": 91.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58, "r_y0": 91.65, "r_x1": 309.6, "r_y1": 91.65, "r_x2": 309.6, "r_y2": 86.69, "r_x3": 299.58, "r_y3": 86.69, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 466.04, "t": 141.67, "r": 483.5, "b": 146.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04, "r_y0": 146.63, "r_x1": 483.5, "r_y1": 146.63, "r_x2": 483.5, "r_y2": 141.67, "r_x3": 466.04, "r_y3": 141.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 459.02, "t": 93.76, "r": 469.16, "b": 98.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02, "r_y0": 98.72, "r_x1": 469.16, "r_y1": 98.72, "r_x2": 469.16, "r_y2": 93.76, "r_x3": 459.02, "r_y3": 93.76, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 455.42, "t": 99.88, "r": 469.16, "b": 104.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.42, "r_y0": 104.84, "r_x1": 469.16, "r_y1": 104.84, "r_x2": 469.16, "r_y2": 99.88, "r_x3": 455.42, "r_y3": 99.88, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 455.05, "t": 106.0, "r": 469.16, "b": 110.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.05, "r_y0": 110.96, "r_x1": 469.16, "r_y1": 110.96, "r_x2": 469.16, "r_y2": 106.0, "r_x3": 455.05, "r_y3": 106.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 467.39, "t": 85.57, "r": 480.65, "b": 90.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39, "r_y0": 90.53, "r_x1": 480.65, "r_y1": 90.53, "r_x2": 480.65, "r_y2": 85.57, "r_x3": 467.39, "r_y3": 85.57, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 160.38, "t": 141.58, "r": 182.63, "b": 146.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.38, "r_y0": 146.54, "r_x1": 182.63, "r_y1": 146.54, "r_x2": 182.63, "r_y2": 141.58, "r_x3": 160.38, "r_y3": 141.58, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 153.74, "t": 94.86, "r": 173.33, "b": 99.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74, "r_y0": 99.82, "r_x1": 173.33, "r_y1": 99.82, "r_x2": 173.33, "r_y2": 94.86, "r_x3": 153.74, "r_y3": 94.86, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 154.51, "t": 100.98, "r": 173.32, "b": 105.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 105.94, "r_x1": 173.32, "r_y1": 105.94, "r_x2": 173.32, "r_y2": 100.98, "r_x3": 154.51, "r_y3": 100.98, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 155.27, "t": 107.1, "r": 173.33, "b": 112.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27, "r_y0": 112.06, "r_x1": 173.33, "r_y1": 112.06, "r_x2": 173.33, "r_y2": 107.1, "r_x3": 155.27, "r_y3": 107.1, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.41, "t": 107.23, "r": 346.0, "b": 112.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41, "r_y0": 112.19, "r_x1": 346.0, "r_y1": 112.19, "r_x2": 346.0, "r_y2": 107.23, "r_x3": 326.41, "r_y3": 107.23, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 327.18, "t": 113.35, "r": 345.99, "b": 118.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.18, "r_y0": 118.31, "r_x1": 345.99, "r_y1": 118.31, "r_x2": 345.99, "r_y2": 113.35, "r_x3": 327.18, "r_y3": 113.35, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 327.94, "t": 119.47, "r": 346.0, "b": 124.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94, "r_y0": 124.43, "r_x1": 346.0, "r_y1": 124.43, "r_x2": 346.0, "r_y2": 119.47, "r_x3": 327.94, "r_y3": 119.47, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 488.99, "t": 104.15, "r": 508.76, "b": 109.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.99, "r_y0": 109.11, "r_x1": 508.76, "r_y1": 109.11, "r_x2": 508.76, "r_y2": 104.15, "r_x3": 488.99, "r_y3": 104.15, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 490.19, "t": 110.27, "r": 508.76, "b": 115.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.19, "r_y0": 115.23, "r_x1": 508.76, "r_y1": 115.23, "r_x2": 508.76, "r_y2": 110.27, "r_x3": 490.19, "r_y3": 110.27, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 489.72, "t": 116.39, "r": 508.77, "b": 121.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72, "r_y0": 121.35, "r_x1": 508.77, "r_y1": 121.35, "r_x2": 508.77, "r_y2": 116.39, "r_x3": 489.72, "r_y3": 116.39, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 490.71, "t": 122.51, "r": 508.77, "b": 127.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71, "r_y0": 127.47, "r_x1": 508.77, "r_y1": 127.47, "r_x2": 508.77, "r_y2": 122.51, "r_x3": 490.71, "r_y3": 122.51, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 185.38, "t": 141.71, "r": 202.84, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.38, "r_y0": 146.67, "r_x1": 202.84, "r_y1": 146.67, "r_x2": 202.84, "r_y2": 141.71, "r_x3": 185.38, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 168.5, "t": 86.14, "r": 197.53, "b": 91.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.5, "r_y0": 91.09, "r_x1": 197.53, "r_y1": 91.09, "r_x2": 197.53, "r_y2": 86.14, "r_x3": 168.5, "r_y3": 86.14, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 357.38, "t": 86.0, "r": 367.4, "b": 90.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.38, "r_y0": 90.95, "r_x1": 367.4, "r_y1": 90.95, "r_x2": 367.4, "r_y2": 86.0, "r_x3": 357.38, "r_y3": 86.0, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 333.73, "t": 141.62, "r": 374.93, "b": 146.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73, "r_y0": 146.58, "r_x1": 374.93, "r_y1": 146.58, "r_x2": 374.93, "r_y2": 141.62, "r_x3": 333.73, "r_y3": 141.62, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 345.69, "t": 86.06, "r": 355.71, "b": 91.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69, "r_y0": 91.01, "r_x1": 355.71, "r_y1": 91.01, "r_x2": 355.71, "r_y2": 86.06, "r_x3": 345.69, "r_y3": 86.06, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 508.54, "t": 141.38, "r": 526.01, "b": 146.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54, "r_y0": 146.33, "r_x1": 526.01, "r_y1": 146.33, "r_x2": 526.01, "r_y2": 141.38, "r_x3": 508.54, "r_y3": 141.38, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 510.45, "t": 86.09, "r": 523.71, "b": 91.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.45, "r_y0": 91.05, "r_x1": 523.71, "r_y1": 91.05, "r_x2": 523.71, "r_y2": 86.09, "r_x3": 510.45, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 1, "label": "caption", "bbox": { "l": 50.11, "t": 165.5, "r": 545.11, "b": 186.36, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 174.41, "r_x1": 545.11, "r_y1": 174.41, "r_x2": 545.11, "r_y2": 165.5, "r_x3": 50.11, "r_y3": 165.5, "coord_origin": "TOPLEFT" }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 186.36, "r_x1": 513.52, "r_y1": 186.36, "r_x2": 513.52, "r_y2": 177.46, "r_x3": 50.11, "r_y3": 177.46, "coord_origin": "TOPLEFT" }, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 61.57, "t": 210.93, "r": 286.37, "b": 231.79, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 219.84, "r_x1": 71.15, "r_y1": 219.84, "r_x2": 71.15, "r_y2": 210.93, "r_x3": 61.57, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.54, "r_y0": 219.84, "r_x1": 286.37, "r_y1": 219.84, "r_x2": 286.37, "r_y2": 210.93, "r_x3": 73.54, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 231.79, "r_x1": 87.47, "r_y1": 231.79, "r_x2": 87.47, "r_y2": 222.89, "r_x3": 70.04, "r_y3": 222.89, "coord_origin": "TOPLEFT" }, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 61.57, "t": 244.07, "r": 286.37, "b": 264.93, "coord_origin": "TOPLEFT" }, "confidence": 0.963, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 252.98, "r_x1": 71.35, "r_y1": 252.98, "r_x2": 71.35, "r_y2": 244.07, "r_x3": 61.57, "r_y3": 244.07, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.79, "r_y0": 252.98, "r_x1": 286.37, "r_y1": 252.98, "r_x2": 286.37, "r_y2": 244.07, "r_x3": 73.79, "r_y3": 244.07, "coord_origin": "TOPLEFT" }, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 264.93, "r_x1": 150.42, "r_y1": 264.93, "r_x2": 150.42, "r_y2": 256.03, "r_x3": 70.04, "r_y3": 256.03, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 279.2, "r": 286.37, "b": 395.71, "coord_origin": "TOPLEFT" }, "confidence": 0.977, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 288.11, "r_x1": 286.36, "r_y1": 288.11, "r_x2": 286.36, "r_y2": 279.2, "r_x3": 62.07, "r_y3": 279.2, "coord_origin": "TOPLEFT" }, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.06, "r_x1": 286.37, "r_y1": 300.06, "r_x2": 286.37, "r_y2": 291.16, "r_x3": 50.11, "r_y3": 291.16, "coord_origin": "TOPLEFT" }, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.02, "r_x1": 286.37, "r_y1": 312.02, "r_x2": 286.37, "r_y2": 303.11, "r_x3": 50.11, "r_y3": 303.11, "coord_origin": "TOPLEFT" }, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 323.97, "r_x1": 286.37, "r_y1": 323.97, "r_x2": 286.37, "r_y2": 315.07, "r_x3": 50.11, "r_y3": 315.07, "coord_origin": "TOPLEFT" }, "text": "More specifically, PDF documents can be seen as a se-", "orig": "More specifically, PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 335.93, "r_x1": 286.37, "r_y1": 335.93, "r_x2": 286.37, "r_y2": 327.02, "r_x3": 50.11, "r_y3": 327.02, "coord_origin": "TOPLEFT" }, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 347.89, "r_x1": 286.37, "r_y1": 347.89, "r_x2": 286.37, "r_y2": 338.98, "r_x3": 50.11, "r_y3": 338.98, "coord_origin": "TOPLEFT" }, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.84, "r_x1": 286.37, "r_y1": 359.84, "r_x2": 286.37, "r_y2": 350.93, "r_x3": 50.11, "r_y3": 350.93, "coord_origin": "TOPLEFT" }, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.8, "r_x1": 286.37, "r_y1": 371.8, "r_x2": 286.37, "r_y2": 362.89, "r_x3": 50.11, "r_y3": 362.89, "coord_origin": "TOPLEFT" }, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 383.75, "r_x1": 286.37, "r_y1": 383.75, "r_x2": 286.37, "r_y2": 374.84, "r_x3": 50.11, "r_y3": 374.84, "coord_origin": "TOPLEFT" }, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 395.71, "r_x1": 154.56, "r_y1": 395.71, "r_x2": 154.56, "r_y2": 386.8, "r_x3": 50.11, "r_y3": 386.8, "coord_origin": "TOPLEFT" }, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 399.07, "r": 286.36, "b": 419.93, "coord_origin": "TOPLEFT" }, "confidence": 0.935, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 407.98, "r_x1": 286.36, "r_y1": 407.98, "r_x2": 286.36, "r_y2": 399.07, "r_x3": 62.07, "r_y3": 399.07, "coord_origin": "TOPLEFT" }, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 419.93, "r_x1": 95.49, "r_y1": 419.93, "r_x2": 95.49, "r_y2": 411.03, "r_x3": 50.11, "r_y3": 411.03, "coord_origin": "TOPLEFT" }, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "list_item", "bbox": { "l": 50.11, "t": 423.3, "r": 286.37, "b": 456.11, "coord_origin": "TOPLEFT" }, "confidence": 0.828, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 432.2, "r_x1": 69.37, "r_y1": 432.2, "r_x2": 69.37, "r_y2": 423.3, "r_x3": 62.07, "r_y3": 423.3, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.81, "r_y0": 432.2, "r_x1": 286.37, "r_y1": 432.2, "r_x2": 286.37, "r_y2": 423.3, "r_x3": 71.81, "r_y3": 423.3, "coord_origin": "TOPLEFT" }, "text": "Get the minimal grid dimensions - number of rows and", "orig": "Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 444.16, "r_x1": 286.37, "r_y1": 444.16, "r_x2": 286.37, "r_y2": 435.25, "r_x3": 50.11, "r_y3": 435.25, "coord_origin": "TOPLEFT" }, "text": "columns for the predicted table structure. This represents", "orig": "columns for the predicted table structure. This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 456.11, "r_x1": 274.51, "r_y1": 456.11, "r_x2": 274.51, "r_y2": 447.21, "r_x3": 50.11, "r_y3": 447.21, "coord_origin": "TOPLEFT" }, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 50.11, "t": 459.48, "r": 286.37, "b": 504.25, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 468.38, "r_x1": 69.54, "r_y1": 468.38, "r_x2": 69.54, "r_y2": 459.48, "r_x3": 62.07, "r_y3": 459.48, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 77.43, "r_y0": 468.38, "r_x1": 286.36, "r_y1": 468.38, "r_x2": 286.36, "r_y2": 459.48, "r_x3": 77.43, "r_y3": 459.48, "coord_origin": "TOPLEFT" }, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 480.34, "r_x1": 286.37, "r_y1": 480.34, "r_x2": 286.37, "r_y2": 471.43, "r_x3": 50.11, "r_y3": 471.43, "coord_origin": "TOPLEFT" }, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 492.29, "r_x1": 286.37, "r_y1": 492.29, "r_x2": 286.37, "r_y2": 483.39, "r_x3": 50.11, "r_y3": 483.39, "coord_origin": "TOPLEFT" }, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 504.25, "r_x1": 110.7, "r_y1": 504.25, "r_x2": 110.7, "r_y2": 495.34, "r_x3": 50.11, "r_y3": 495.34, "coord_origin": "TOPLEFT" }, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 50.11, "t": 507.61, "r": 286.36, "b": 528.47, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 516.52, "r_x1": 69.86, "r_y1": 516.52, "r_x2": 69.86, "r_y2": 507.61, "r_x3": 62.07, "r_y3": 507.61, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.46, "r_y0": 516.52, "r_x1": 286.36, "r_y1": 516.52, "r_x2": 286.36, "r_y2": 507.61, "r_x3": 72.46, "r_y3": 507.61, "coord_origin": "TOPLEFT" }, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 528.47, "r_x1": 226.07, "r_y1": 528.47, "r_x2": 226.07, "r_y2": 519.57, "r_x3": 50.11, "r_y3": 519.57, "coord_origin": "TOPLEFT" }, "text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 50.11, "t": 531.84, "r": 286.37, "b": 564.65, "coord_origin": "TOPLEFT" }, "confidence": 0.949, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 540.74, "r_x1": 286.36, "r_y1": 540.74, "r_x2": 286.36, "r_y2": 531.84, "r_x3": 62.07, "r_y3": 531.84, "coord_origin": "TOPLEFT" }, "text": "3.a. If all IOU scores in a column are below the thresh-", "orig": "3.a. If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 552.7, "r_x1": 286.37, "r_y1": 552.7, "r_x2": 286.37, "r_y2": 543.79, "r_x3": 50.11, "r_y3": 543.79, "coord_origin": "TOPLEFT" }, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 564.65, "r_x1": 114.03, "r_y1": 564.65, "r_x2": 114.03, "r_y2": 555.75, "r_x3": 50.11, "r_y3": 555.75, "coord_origin": "TOPLEFT" }, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 568.02, "r": 286.37, "b": 600.83, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 576.92, "r_x1": 69.54, "r_y1": 576.92, "r_x2": 69.54, "r_y2": 568.02, "r_x3": 62.07, "r_y3": 568.02, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.73, "r_y0": 576.92, "r_x1": 286.37, "r_y1": 576.92, "r_x2": 286.37, "r_y2": 568.02, "r_x3": 76.73, "r_y3": 568.02, "coord_origin": "TOPLEFT" }, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 588.88, "r_x1": 286.37, "r_y1": 588.88, "r_x2": 286.37, "r_y2": 579.97, "r_x3": 50.11, "r_y3": 579.97, "coord_origin": "TOPLEFT" }, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 600.83, "r_x1": 278.7, "r_y1": 600.83, "r_x2": 278.7, "r_y2": 591.93, "r_x3": 50.11, "r_y3": 591.93, "coord_origin": "TOPLEFT" }, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "formula", "bbox": { "l": 110.7, "t": 623.44, "r": 286.36, "b": 654.11, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.03, "r_y0": 632.84, "r_x1": 157.95, "r_y1": 632.84, "r_x2": 157.95, "r_y2": 623.99, "r_x3": 112.03, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.72, "r_y0": 632.84, "r_x1": 203.5, "r_y1": 632.84, "r_x2": 203.5, "r_y2": 623.99, "r_x3": 160.72, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58, "r_y0": 640.18, "r_x1": 189.15, "r_y1": 640.18, "r_x2": 189.15, "r_y2": 633.98, "r_x3": 185.58, "r_y3": 633.98, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 203.5, "r_y0": 632.84, "r_x1": 208.48, "r_y1": 632.84, "r_x2": 208.48, "r_y2": 623.44, "r_x3": 203.5, "r_y3": 623.44, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.48, "r_y0": 632.84, "r_x1": 220.29, "r_y1": 632.84, "r_x2": 220.29, "r_y2": 623.99, "r_x3": 208.48, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.79, "r_y0": 632.84, "r_x1": 225.77, "r_y1": 632.84, "r_x2": 225.77, "r_y2": 623.44, "r_x3": 220.79, "r_y3": 623.44, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.7, "r_y0": 654.11, "r_x1": 122.51, "r_y1": 654.11, "r_x2": 122.51, "r_y2": 645.26, "r_x3": 110.7, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.78, "r_y0": 654.11, "r_x1": 133.53, "r_y1": 654.11, "r_x2": 133.53, "r_y2": 645.26, "r_x3": 125.78, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 136.29, "r_y0": 654.11, "r_x1": 156.0, "r_y1": 654.11, "r_x2": 156.0, "r_y2": 645.26, "r_x3": 136.29, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "max", "orig": "max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.0, "r_y0": 654.11, "r_x1": 160.98, "r_y1": 654.11, "r_x2": 160.98, "r_y2": 644.7, "r_x3": 156.0, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.98, "r_y0": 654.11, "r_x1": 170.24, "r_y1": 654.11, "r_x2": 170.24, "r_y2": 645.26, "r_x3": 160.98, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.74, "r_y0": 654.11, "r_x1": 185.68, "r_y1": 654.11, "r_x2": 185.68, "r_y2": 644.7, "r_x3": 170.74, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "} \u2212", "orig": "} \u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.89, "r_y0": 654.11, "r_x1": 206.05, "r_y1": 654.11, "r_x2": 206.05, "r_y2": 645.26, "r_x3": 187.89, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "min", "orig": "min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.05, "r_y0": 654.11, "r_x1": 211.04, "r_y1": 654.11, "r_x2": 211.04, "r_y2": 644.7, "r_x3": 206.05, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.03, "r_y0": 654.11, "r_x1": 220.29, "r_y1": 654.11, "r_x2": 220.29, "r_y2": 645.26, "r_x3": 211.03, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.79, "r_y0": 654.11, "r_x1": 225.77, "r_y1": 654.11, "r_x2": 225.77, "r_y2": 644.7, "r_x3": 220.79, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 643.79, "r_x1": 286.36, "r_y1": 643.79, "r_x2": 286.36, "r_y2": 634.89, "r_x3": 274.75, "r_y3": 634.89, "coord_origin": "TOPLEFT" }, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 667.35, "r": 286.36, "b": 688.93, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 676.97, "r_x1": 74.45, "r_y1": 676.97, "r_x2": 74.45, "r_y2": 668.07, "r_x3": 50.11, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.34, "r_y0": 676.75, "r_x1": 82.65, "r_y1": 676.75, "r_x2": 82.65, "r_y2": 667.91, "r_x3": 78.34, "r_y3": 667.91, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.53, "r_y0": 676.97, "r_x1": 123.63, "r_y1": 676.97, "r_x2": 123.63, "r_y2": 668.07, "r_x3": 86.53, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "is one of", "orig": "is one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 127.52, "r_y0": 676.75, "r_x1": 132.5, "r_y1": 676.75, "r_x2": 132.5, "r_y2": 667.35, "r_x3": 127.52, "r_y3": 667.35, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.5, "r_y0": 676.97, "r_x1": 210.7, "r_y1": 676.97, "r_x2": 210.7, "r_y2": 668.07, "r_x3": 132.5, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "left, centroid, right", "orig": "left, centroid, right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.7, "r_y0": 676.75, "r_x1": 215.68, "r_y1": 676.75, "r_x2": 215.68, "r_y2": 667.35, "r_x3": 210.7, "r_y3": 667.35, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.56, "r_y0": 676.97, "r_x1": 233.95, "r_y1": 676.97, "r_x2": 233.95, "r_y2": 668.07, "r_x3": 219.56, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 237.83, "r_y0": 676.75, "r_x1": 247.09, "r_y1": 676.75, "r_x2": 247.09, "r_y2": 667.91, "r_x3": 237.83, "r_y3": 667.91, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.47, "r_y0": 676.97, "r_x1": 286.36, "r_y1": 676.97, "r_x2": 286.36, "r_y2": 668.07, "r_x3": 251.47, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "is the x-", "orig": "is the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 688.93, "r_x1": 205.89, "r_y1": 688.93, "r_x2": 205.89, "r_y2": 680.02, "r_x3": 50.11, "r_y3": 680.02, "coord_origin": "TOPLEFT" }, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 692.29, "r": 286.36, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 701.2, "r_x1": 69.54, "r_y1": 701.2, "r_x2": 69.54, "r_y2": 692.29, "r_x3": 62.07, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.27, "r_y0": 701.2, "r_x1": 286.36, "r_y1": 701.2, "r_x2": 286.36, "r_y2": 692.29, "r_x3": 76.27, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 94.6, "r_y1": 713.15, "r_x2": 94.6, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.6, "r_y0": 712.93, "r_x1": 103.29, "r_y1": 712.93, "r_x2": 103.29, "r_y2": 704.09, "r_x3": 97.6, "r_y3": 704.09, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.29, "r_y0": 713.15, "r_x1": 286.36, "r_y1": 713.15, "r_x2": 286.36, "r_y2": 704.25, "r_x3": 103.29, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 308.86, "t": 210.93, "r": 545.12, "b": 255.7, "coord_origin": "TOPLEFT" }, "confidence": 0.894, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 219.84, "r_x1": 545.12, "r_y1": 219.84, "r_x2": 545.12, "r_y2": 210.93, "r_x3": 308.86, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "dian cell size for all table cells. The usage of median dur-", "orig": "dian cell size for all table cells. The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 231.79, "r_x1": 545.12, "r_y1": 231.79, "r_x2": 545.12, "r_y2": 222.89, "r_x3": 308.86, "r_y3": 222.89, "coord_origin": "TOPLEFT" }, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 243.75, "r_x1": 545.12, "r_y1": 243.75, "r_x2": 545.12, "r_y2": 234.84, "r_x3": 308.86, "r_y3": 234.84, "coord_origin": "TOPLEFT" }, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 255.7, "r_x1": 339.58, "r_y1": 255.7, "r_x2": 339.58, "r_y2": 246.8, "r_x3": 308.86, "r_y3": 246.8, "coord_origin": "TOPLEFT" }, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 259.1, "r": 545.11, "b": 279.96, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 268.01, "r_x1": 328.29, "r_y1": 268.01, "r_x2": 328.29, "r_y2": 259.1, "r_x3": 320.82, "r_y3": 259.1, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.88, "r_y0": 268.01, "r_x1": 545.11, "r_y1": 268.01, "r_x2": 545.11, "r_y2": 259.1, "r_x3": 334.88, "r_y3": 259.1, "coord_origin": "TOPLEFT" }, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 279.96, "r_x1": 338.19, "r_y1": 279.96, "r_x2": 338.19, "r_y2": 271.06, "r_x3": 308.86, "r_y3": 271.06, "coord_origin": "TOPLEFT" }, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.68, "r_y0": 279.74, "r_x1": 346.38, "r_y1": 279.74, "r_x2": 346.38, "r_y2": 270.9, "r_x3": 340.68, "r_y3": 270.9, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.38, "r_y0": 279.96, "r_x1": 453.72, "r_y1": 279.96, "r_x2": 453.72, "r_y2": 271.06, "r_x3": 346.38, "r_y3": 271.06, "coord_origin": "TOPLEFT" }, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 283.36, "r": 545.12, "b": 387.91, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 292.27, "r_x1": 328.39, "r_y1": 292.27, "r_x2": 328.39, "r_y2": 283.36, "r_x3": 320.82, "r_y3": 283.36, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.91, "r_y0": 292.27, "r_x1": 545.11, "r_y1": 292.27, "r_x2": 545.11, "r_y2": 283.36, "r_x3": 330.91, "r_y3": 283.36, "coord_origin": "TOPLEFT" }, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.22, "r_x1": 545.12, "r_y1": 304.22, "r_x2": 545.12, "r_y2": 295.32, "r_x3": 308.86, "r_y3": 295.32, "coord_origin": "TOPLEFT" }, "text": "corrected bounding boxes and PDF cells. This time use a", "orig": "corrected bounding boxes and PDF cells. This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.18, "r_x1": 545.12, "r_y1": 316.18, "r_x2": 545.12, "r_y2": 307.27, "r_x3": 308.86, "r_y3": 307.27, "coord_origin": "TOPLEFT" }, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 328.13, "r_x1": 545.12, "r_y1": 328.13, "r_x2": 545.12, "r_y2": 319.23, "r_x3": 308.86, "r_y3": 319.23, "coord_origin": "TOPLEFT" }, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 340.09, "r_x1": 397.19, "r_y1": 340.09, "r_x2": 397.19, "r_y2": 331.18, "r_x3": 308.86, "r_y3": 331.18, "coord_origin": "TOPLEFT" }, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.66, "r_y0": 340.09, "r_x1": 545.12, "r_y1": 340.09, "r_x2": 545.12, "r_y2": 331.18, "r_x3": 403.66, "r_y3": 331.18, "coord_origin": "TOPLEFT" }, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 352.05, "r_x1": 545.12, "r_y1": 352.05, "r_x2": 545.12, "r_y2": 343.14, "r_x3": 308.86, "r_y3": 343.14, "coord_origin": "TOPLEFT" }, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 364.0, "r_x1": 545.12, "r_y1": 364.0, "r_x2": 545.12, "r_y2": 355.09, "r_x3": 308.86, "r_y3": 355.09, "coord_origin": "TOPLEFT" }, "text": "is preferred. This covers the cases where the PDF cells are", "orig": "is preferred. This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 375.96, "r_x1": 545.12, "r_y1": 375.96, "r_x2": 545.12, "r_y2": 367.05, "r_x3": 308.86, "r_y3": 367.05, "coord_origin": "TOPLEFT" }, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 387.91, "r_x1": 329.61, "r_y1": 387.91, "r_x2": 329.61, "r_y2": 379.0, "r_x3": 308.86, "r_y3": 379.0, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "list_item", "bbox": { "l": 308.86, "t": 391.31, "r": 545.12, "b": 459.99, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 400.22, "r_x1": 328.55, "r_y1": 400.22, "r_x2": 328.55, "r_y2": 391.31, "r_x3": 320.82, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.13, "r_y0": 400.22, "r_x1": 545.12, "r_y1": 400.22, "r_x2": 545.12, "r_y2": 391.31, "r_x3": 331.13, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.17, "r_x1": 545.12, "r_y1": 412.17, "r_x2": 545.12, "r_y2": 403.27, "r_x3": 308.86, "r_y3": 403.27, "coord_origin": "TOPLEFT" }, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.13, "r_x1": 545.12, "r_y1": 424.13, "r_x2": 545.12, "r_y2": 415.22, "r_x3": 308.86, "r_y3": 415.22, "coord_origin": "TOPLEFT" }, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.08, "r_x1": 545.12, "r_y1": 436.08, "r_x2": 545.12, "r_y2": 427.18, "r_x3": 308.86, "r_y3": 427.18, "coord_origin": "TOPLEFT" }, "text": "columns pointing to the same PDF column. In such case", "orig": "columns pointing to the same PDF column. In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.04, "r_x1": 545.12, "r_y1": 448.04, "r_x2": 545.12, "r_y2": 439.13, "r_x3": 308.86, "r_y3": 439.13, "coord_origin": "TOPLEFT" }, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 459.99, "r_x1": 426.18, "r_y1": 459.99, "r_x2": 426.18, "r_y2": 451.09, "r_x3": 308.86, "r_y3": 451.09, "coord_origin": "TOPLEFT" }, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "list_item", "bbox": { "l": 308.86, "t": 463.39, "r": 545.12, "b": 567.94, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 472.3, "r_x1": 328.67, "r_y1": 472.3, "r_x2": 328.67, "r_y2": 463.39, "r_x3": 320.82, "r_y3": 463.39, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.29, "r_y0": 472.3, "r_x1": 545.11, "r_y1": 472.3, "r_x2": 545.11, "r_y2": 463.39, "r_x3": 331.29, "r_y3": 463.39, "coord_origin": "TOPLEFT" }, "text": "Pick up the remaining orphan cells. There could be", "orig": "Pick up the remaining orphan cells. There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 484.25, "r_x1": 545.12, "r_y1": 484.25, "r_x2": 545.12, "r_y2": 475.35, "r_x3": 308.86, "r_y3": 475.35, "coord_origin": "TOPLEFT" }, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 496.21, "r_x1": 545.12, "r_y1": 496.21, "r_x2": 545.12, "r_y2": 487.3, "r_x3": 308.86, "r_y3": 487.3, "coord_origin": "TOPLEFT" }, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 508.16, "r_x1": 381.9, "r_y1": 508.16, "r_x2": 381.9, "r_y2": 499.26, "r_x3": 308.86, "r_y3": 499.26, "coord_origin": "TOPLEFT" }, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 508.16, "r_x1": 545.12, "r_y1": 508.16, "r_x2": 545.12, "r_y2": 499.26, "r_x3": 388.7, "r_y3": 499.26, "coord_origin": "TOPLEFT" }, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 520.12, "r_x1": 545.12, "r_y1": 520.12, "r_x2": 545.12, "r_y2": 511.21, "r_x3": 308.86, "r_y3": 511.21, "coord_origin": "TOPLEFT" }, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 532.07, "r_x1": 545.12, "r_y1": 532.07, "r_x2": 545.12, "r_y2": 523.17, "r_x3": 308.86, "r_y3": 523.17, "coord_origin": "TOPLEFT" }, "text": "bounding box on the geometry of the grid. This mapping", "orig": "bounding box on the geometry of the grid. This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 544.03, "r_x1": 545.11, "r_y1": 544.03, "r_x2": 545.11, "r_y2": 535.12, "r_x3": 308.86, "r_y3": 535.12, "coord_origin": "TOPLEFT" }, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 555.98, "r_x1": 545.12, "r_y1": 555.98, "r_x2": 545.12, "r_y2": 547.08, "r_x3": 308.86, "r_y3": 547.08, "coord_origin": "TOPLEFT" }, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 567.94, "r_x1": 442.22, "r_y1": 567.94, "r_x2": 442.22, "r_y2": 559.03, "r_x3": 308.86, "r_y3": 559.03, "coord_origin": "TOPLEFT" }, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 308.86, "t": 571.34, "r": 545.12, "b": 604.15, "coord_origin": "TOPLEFT" }, "confidence": 0.846, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 580.24, "r_x1": 545.11, "r_y1": 580.24, "r_x2": 545.11, "r_y2": 571.34, "r_x3": 320.82, "r_y3": 571.34, "coord_origin": "TOPLEFT" }, "text": "9a. Compute the top and bottom boundary of the hori-", "orig": "9a. Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 592.2, "r_x1": 471.64, "r_y1": 592.2, "r_x2": 471.64, "r_y2": 583.29, "r_x3": 308.86, "r_y3": 583.29, "coord_origin": "TOPLEFT" }, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.83, "r_y0": 591.98, "r_x1": 479.72, "r_y1": 591.98, "r_x2": 479.72, "r_y2": 583.13, "r_x3": 474.83, "r_y3": 583.13, "coord_origin": "TOPLEFT" }, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.27, "r_y0": 592.2, "r_x1": 545.12, "r_y1": 592.2, "r_x2": 545.12, "r_y2": 583.29, "r_x3": 483.27, "r_y3": 583.29, "coord_origin": "TOPLEFT" }, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 604.15, "r_x1": 329.91, "r_y1": 604.15, "r_x2": 329.91, "r_y2": 595.25, "r_x3": 308.86, "r_y3": 595.25, "coord_origin": "TOPLEFT" }, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "list_item", "bbox": { "l": 308.86, "t": 607.55, "r": 545.12, "b": 628.42, "coord_origin": "TOPLEFT" }, "confidence": 0.772, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 616.46, "r_x1": 332.87, "r_y1": 616.46, "r_x2": 332.87, "r_y2": 607.55, "r_x3": 320.82, "r_y3": 607.55, "coord_origin": "TOPLEFT" }, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93, "r_y0": 616.46, "r_x1": 545.12, "r_y1": 616.46, "r_x2": 545.12, "r_y2": 607.55, "r_x3": 339.93, "r_y3": 607.55, "coord_origin": "TOPLEFT" }, "text": "Intersect the orphan\u2019s bounding box with the row", "orig": "Intersect the orphan\u2019s bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 628.42, "r_x1": 495.29, "r_y1": 628.42, "r_x2": 495.29, "r_y2": 619.51, "r_x3": 308.86, "r_y3": 619.51, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 308.86, "t": 631.81, "r": 545.12, "b": 664.63, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 640.72, "r_x1": 545.12, "r_y1": 640.72, "r_x2": 545.12, "r_y2": 631.81, "r_x3": 320.82, "r_y3": 631.81, "coord_origin": "TOPLEFT" }, "text": "9c. Compute the left and right boundary of the vertical", "orig": "9c. Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 652.68, "r_x1": 455.28, "r_y1": 652.68, "r_x2": 455.28, "r_y2": 643.77, "r_x3": 308.86, "r_y3": 643.77, "coord_origin": "TOPLEFT" }, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 457.78, "r_y0": 652.46, "r_x1": 463.47, "r_y1": 652.46, "r_x2": 463.47, "r_y2": 643.61, "r_x3": 457.78, "r_y3": 643.61, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.97, "r_y0": 652.68, "r_x1": 545.11, "r_y1": 652.68, "r_x2": 545.11, "r_y2": 643.77, "r_x3": 465.97, "r_y3": 643.77, "coord_origin": "TOPLEFT" }, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 664.63, "r_x1": 332.38, "r_y1": 664.63, "r_x2": 332.38, "r_y2": 655.72, "r_x3": 308.86, "r_y3": 655.72, "coord_origin": "TOPLEFT" }, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "list_item", "bbox": { "l": 308.86, "t": 668.03, "r": 545.11, "b": 688.89, "coord_origin": "TOPLEFT" }, "confidence": 0.759, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 676.94, "r_x1": 545.11, "r_y1": 676.94, "r_x2": 545.11, "r_y2": 668.03, "r_x3": 320.82, "r_y3": 668.03, "coord_origin": "TOPLEFT" }, "text": "9d. Intersect the orphan\u2019s bounding box with the column", "orig": "9d. Intersect the orphan\u2019s bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 688.89, "r_x1": 510.58, "r_y1": 688.89, "r_x2": 510.58, "r_y2": 679.99, "r_x3": 308.86, "r_y3": 679.99, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "list_item", "bbox": { "l": 308.86, "t": 692.29, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.697, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 320.82, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "picture", "id": 30, "page_no": 11, "cluster": { "id": 30, "label": "picture", "bbox": { "l": 53.54, "t": 74.75, "r": 544.94, "b": 147.59, "coord_origin": "TOPLEFT" }, "confidence": 0.603, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39, "r_y0": 83.26, "r_x1": 151.95, "r_y1": 83.26, "r_x2": 151.95, "r_y2": 77.31, "r_x3": 119.39, "r_y3": 77.31, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.35, "r_y0": 81.14, "r_x1": 59.33, "r_y1": 81.14, "r_x2": 59.33, "r_y2": 75.19, "r_x3": 53.35, "r_y3": 75.19, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.58, "r_y0": 83.41, "r_x1": 319.83, "r_y1": 83.41, "r_x2": 319.83, "r_y2": 77.46, "r_x3": 289.58, "r_y3": 77.46, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37, "r_y0": 83.2, "r_x1": 481.76, "r_y1": 83.2, "r_x2": 481.76, "r_y2": 77.25, "r_x3": 448.37, "r_y3": 77.25, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.55, "r_y0": 146.23, "r_x1": 94.98, "r_y1": 146.23, "r_x2": 94.98, "r_y2": 141.28, "r_x3": 82.55, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.04, "r_y0": 106.06, "r_x1": 85.29, "r_y1": 106.06, "r_x2": 85.29, "r_y2": 101.1, "r_x3": 63.04, "r_y3": 101.1, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 129.35, "r_x1": 85.23, "r_y1": 129.35, "r_x2": 85.23, "r_y2": 124.4, "r_x3": 67.77, "r_y3": 124.4, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55, "r_y0": 107.5, "r_x1": 249.8, "r_y1": 107.5, "r_x2": 249.8, "r_y2": 102.54, "r_x3": 227.55, "r_y3": 102.54, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.2, "r_y0": 131.94, "r_x1": 249.66, "r_y1": 131.94, "r_x2": 249.66, "r_y2": 126.99, "r_x3": 232.2, "r_y3": 126.99, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.23, "r_y0": 119.0, "r_x1": 413.7, "r_y1": 119.0, "r_x2": 413.7, "r_y2": 114.05, "r_x3": 396.23, "r_y3": 114.05, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.38, "r_y0": 146.23, "r_x1": 105.08, "r_y1": 146.23, "r_x2": 105.08, "r_y2": 141.28, "r_x3": 97.38, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.94, "r_y0": 90.69, "r_x1": 76.15, "r_y1": 90.69, "r_x2": 76.15, "r_y2": 85.73, "r_x3": 60.94, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.3, "r_y0": 91.18, "r_x1": 106.99, "r_y1": 91.18, "r_x2": 106.99, "r_y2": 86.22, "r_x3": 82.3, "r_y3": 86.22, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.21, "r_y0": 146.56, "r_x1": 281.88, "r_y1": 146.56, "r_x2": 281.88, "r_y2": 141.61, "r_x3": 246.21, "r_y3": 141.61, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.7, "r_y0": 90.69, "r_x1": 241.91, "r_y1": 90.69, "r_x2": 241.91, "r_y2": 85.73, "r_x3": 226.7, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.94, "r_y0": 91.05, "r_x1": 282.49, "r_y1": 91.05, "r_x2": 282.49, "r_y2": 86.09, "r_x3": 249.94, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19, "r_y0": 146.23, "r_x1": 444.69, "r_y1": 146.23, "r_x2": 444.69, "r_y2": 141.28, "r_x3": 410.19, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 90.69, "r_x1": 432.67, "r_y1": 90.69, "r_x2": 432.67, "r_y2": 85.73, "r_x3": 391.37, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61, "r_y0": 91.22, "r_x1": 445.62, "r_y1": 91.22, "r_x2": 445.62, "r_y2": 86.26, "r_x3": 435.61, "r_y3": 86.26, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.95, "r_y0": 146.25, "r_x1": 136.2, "r_y1": 146.25, "r_x2": 136.2, "r_y2": 141.29, "r_x3": 113.95, "r_y3": 141.29, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.92, "r_y0": 99.78, "r_x1": 127.05, "r_y1": 99.78, "r_x2": 127.05, "r_y2": 94.82, "r_x3": 116.92, "r_y3": 94.82, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.31, "r_y0": 105.9, "r_x1": 127.05, "r_y1": 105.9, "r_x2": 127.05, "r_y2": 100.94, "r_x3": 113.31, "r_y3": 100.94, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94, "r_y0": 112.02, "r_x1": 127.06, "r_y1": 112.02, "r_x2": 127.06, "r_y2": 107.06, "r_x3": 112.94, "r_y3": 107.06, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.23, "r_y0": 127.57, "r_x1": 126.97, "r_y1": 127.57, "r_x2": 126.97, "r_y2": 122.62, "r_x3": 113.23, "r_y3": 122.62, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85, "r_y0": 133.69, "r_x1": 126.97, "r_y1": 133.69, "r_x2": 126.97, "r_y2": 128.74, "r_x3": 112.85, "r_y3": 128.74, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.58, "r_y0": 146.39, "r_x1": 156.04, "r_y1": 146.39, "r_x2": 156.04, "r_y2": 141.44, "r_x3": 138.58, "r_y3": 141.44, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03, "r_y0": 91.23, "r_x1": 151.04, "r_y1": 91.23, "r_x2": 151.04, "r_y2": 86.27, "r_x3": 122.03, "r_y3": 86.27, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65, "r_y0": 91.51, "r_x1": 321.67, "r_y1": 91.51, "r_x2": 321.67, "r_y2": 86.55, "r_x3": 311.65, "r_y3": 86.55, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89, "r_y0": 146.67, "r_x1": 310.15, "r_y1": 146.67, "r_x2": 310.15, "r_y2": 141.71, "r_x3": 287.89, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.24, "r_y0": 98.04, "r_x1": 299.37, "r_y1": 98.04, "r_x2": 299.37, "r_y2": 93.08, "r_x3": 289.24, "r_y3": 93.08, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 104.16, "r_x1": 299.37, "r_y1": 104.16, "r_x2": 299.37, "r_y2": 99.2, "r_x3": 285.64, "r_y3": 99.2, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26, "r_y0": 110.28, "r_x1": 299.38, "r_y1": 110.28, "r_x2": 299.38, "r_y2": 105.32, "r_x3": 285.26, "r_y3": 105.32, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43, "r_y0": 125.35, "r_x1": 299.17, "r_y1": 125.35, "r_x2": 299.17, "r_y2": 120.39, "r_x3": 285.43, "r_y3": 120.39, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.06, "r_y0": 131.47, "r_x1": 299.17, "r_y1": 131.47, "r_x2": 299.17, "r_y2": 126.51, "r_x3": 285.06, "r_y3": 126.51, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.35, "r_y0": 146.67, "r_x1": 328.81, "r_y1": 146.67, "r_x2": 328.81, "r_y2": 141.71, "r_x3": 311.35, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58, "r_y0": 91.65, "r_x1": 309.6, "r_y1": 91.65, "r_x2": 309.6, "r_y2": 86.69, "r_x3": 299.58, "r_y3": 86.69, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04, "r_y0": 146.63, "r_x1": 483.5, "r_y1": 146.63, "r_x2": 483.5, "r_y2": 141.67, "r_x3": 466.04, "r_y3": 141.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02, "r_y0": 98.72, "r_x1": 469.16, "r_y1": 98.72, "r_x2": 469.16, "r_y2": 93.76, "r_x3": 459.02, "r_y3": 93.76, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.42, "r_y0": 104.84, "r_x1": 469.16, "r_y1": 104.84, "r_x2": 469.16, "r_y2": 99.88, "r_x3": 455.42, "r_y3": 99.88, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.05, "r_y0": 110.96, "r_x1": 469.16, "r_y1": 110.96, "r_x2": 469.16, "r_y2": 106.0, "r_x3": 455.05, "r_y3": 106.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39, "r_y0": 90.53, "r_x1": 480.65, "r_y1": 90.53, "r_x2": 480.65, "r_y2": 85.57, "r_x3": 467.39, "r_y3": 85.57, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.38, "r_y0": 146.54, "r_x1": 182.63, "r_y1": 146.54, "r_x2": 182.63, "r_y2": 141.58, "r_x3": 160.38, "r_y3": 141.58, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74, "r_y0": 99.82, "r_x1": 173.33, "r_y1": 99.82, "r_x2": 173.33, "r_y2": 94.86, "r_x3": 153.74, "r_y3": 94.86, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 105.94, "r_x1": 173.32, "r_y1": 105.94, "r_x2": 173.32, "r_y2": 100.98, "r_x3": 154.51, "r_y3": 100.98, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27, "r_y0": 112.06, "r_x1": 173.33, "r_y1": 112.06, "r_x2": 173.33, "r_y2": 107.1, "r_x3": 155.27, "r_y3": 107.1, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41, "r_y0": 112.19, "r_x1": 346.0, "r_y1": 112.19, "r_x2": 346.0, "r_y2": 107.23, "r_x3": 326.41, "r_y3": 107.23, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.18, "r_y0": 118.31, "r_x1": 345.99, "r_y1": 118.31, "r_x2": 345.99, "r_y2": 113.35, "r_x3": 327.18, "r_y3": 113.35, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94, "r_y0": 124.43, "r_x1": 346.0, "r_y1": 124.43, "r_x2": 346.0, "r_y2": 119.47, "r_x3": 327.94, "r_y3": 119.47, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.99, "r_y0": 109.11, "r_x1": 508.76, "r_y1": 109.11, "r_x2": 508.76, "r_y2": 104.15, "r_x3": 488.99, "r_y3": 104.15, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.19, "r_y0": 115.23, "r_x1": 508.76, "r_y1": 115.23, "r_x2": 508.76, "r_y2": 110.27, "r_x3": 490.19, "r_y3": 110.27, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72, "r_y0": 121.35, "r_x1": 508.77, "r_y1": 121.35, "r_x2": 508.77, "r_y2": 116.39, "r_x3": 489.72, "r_y3": 116.39, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71, "r_y0": 127.47, "r_x1": 508.77, "r_y1": 127.47, "r_x2": 508.77, "r_y2": 122.51, "r_x3": 490.71, "r_y3": 122.51, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.38, "r_y0": 146.67, "r_x1": 202.84, "r_y1": 146.67, "r_x2": 202.84, "r_y2": 141.71, "r_x3": 185.38, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.5, "r_y0": 91.09, "r_x1": 197.53, "r_y1": 91.09, "r_x2": 197.53, "r_y2": 86.14, "r_x3": 168.5, "r_y3": 86.14, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.38, "r_y0": 90.95, "r_x1": 367.4, "r_y1": 90.95, "r_x2": 367.4, "r_y2": 86.0, "r_x3": 357.38, "r_y3": 86.0, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73, "r_y0": 146.58, "r_x1": 374.93, "r_y1": 146.58, "r_x2": 374.93, "r_y2": 141.62, "r_x3": 333.73, "r_y3": 141.62, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69, "r_y0": 91.01, "r_x1": 355.71, "r_y1": 91.01, "r_x2": 355.71, "r_y2": 86.06, "r_x3": 345.69, "r_y3": 86.06, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54, "r_y0": 146.33, "r_x1": 526.01, "r_y1": 146.33, "r_x2": 526.01, "r_y2": 141.38, "r_x3": 508.54, "r_y3": 141.38, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.45, "r_y0": 91.05, "r_x1": 523.71, "r_y1": 91.05, "r_x2": 523.71, "r_y2": 86.09, "r_x3": 510.45, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 46, "label": "text", "bbox": { "l": 119.39, "t": 77.31, "r": 151.95, "b": 83.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39, "r_y0": 83.26, "r_x1": 151.95, "r_y1": 83.26, "r_x2": 151.95, "r_y2": 77.31, "r_x3": 119.39, "r_y3": 77.31, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 53.35, "t": 75.19, "r": 59.33, "b": 81.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.35, "r_y0": 81.14, "r_x1": 59.33, "r_y1": 81.14, "r_x2": 59.33, "r_y2": 75.19, "r_x3": 53.35, "r_y3": 75.19, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 289.58, "t": 77.46, "r": 319.83, "b": 83.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.58, "r_y0": 83.41, "r_x1": 319.83, "r_y1": 83.41, "r_x2": 319.83, "r_y2": 77.46, "r_x3": 289.58, "r_y3": 77.46, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 448.37, "t": 77.25, "r": 481.76, "b": 83.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37, "r_y0": 83.2, "r_x1": 481.76, "r_y1": 83.2, "r_x2": 481.76, "r_y2": 77.25, "r_x3": 448.37, "r_y3": 77.25, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 82.55, "t": 141.28, "r": 94.98, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.55, "r_y0": 146.23, "r_x1": 94.98, "r_y1": 146.23, "r_x2": 94.98, "r_y2": 141.28, "r_x3": 82.55, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 63.04, "t": 101.1, "r": 85.29, "b": 106.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.04, "r_y0": 106.06, "r_x1": 85.29, "r_y1": 106.06, "r_x2": 85.29, "r_y2": 101.1, "r_x3": 63.04, "r_y3": 101.1, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 67.77, "t": 124.4, "r": 85.23, "b": 129.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 129.35, "r_x1": 85.23, "r_y1": 129.35, "r_x2": 85.23, "r_y2": 124.4, "r_x3": 67.77, "r_y3": 124.4, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 227.55, "t": 102.54, "r": 249.8, "b": 107.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55, "r_y0": 107.5, "r_x1": 249.8, "r_y1": 107.5, "r_x2": 249.8, "r_y2": 102.54, "r_x3": 227.55, "r_y3": 102.54, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 232.2, "t": 126.99, "r": 249.66, "b": 131.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.2, "r_y0": 131.94, "r_x1": 249.66, "r_y1": 131.94, "r_x2": 249.66, "r_y2": 126.99, "r_x3": 232.2, "r_y3": 126.99, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 396.23, "t": 114.05, "r": 413.7, "b": 119.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.23, "r_y0": 119.0, "r_x1": 413.7, "r_y1": 119.0, "r_x2": 413.7, "r_y2": 114.05, "r_x3": 396.23, "r_y3": 114.05, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 97.38, "t": 141.28, "r": 105.08, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.38, "r_y0": 146.23, "r_x1": 105.08, "r_y1": 146.23, "r_x2": 105.08, "r_y2": 141.28, "r_x3": 97.38, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 60.94, "t": 85.73, "r": 76.15, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.94, "r_y0": 90.69, "r_x1": 76.15, "r_y1": 90.69, "r_x2": 76.15, "r_y2": 85.73, "r_x3": 60.94, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 82.3, "t": 86.22, "r": 106.99, "b": 91.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.3, "r_y0": 91.18, "r_x1": 106.99, "r_y1": 91.18, "r_x2": 106.99, "r_y2": 86.22, "r_x3": 82.3, "r_y3": 86.22, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 246.21, "t": 141.61, "r": 281.88, "b": 146.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.21, "r_y0": 146.56, "r_x1": 281.88, "r_y1": 146.56, "r_x2": 281.88, "r_y2": 141.61, "r_x3": 246.21, "r_y3": 141.61, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 226.7, "t": 85.73, "r": 241.91, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.7, "r_y0": 90.69, "r_x1": 241.91, "r_y1": 90.69, "r_x2": 241.91, "r_y2": 85.73, "r_x3": 226.7, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 249.94, "t": 86.09, "r": 282.49, "b": 91.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.94, "r_y0": 91.05, "r_x1": 282.49, "r_y1": 91.05, "r_x2": 282.49, "r_y2": 86.09, "r_x3": 249.94, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 410.19, "t": 141.28, "r": 444.69, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19, "r_y0": 146.23, "r_x1": 444.69, "r_y1": 146.23, "r_x2": 444.69, "r_y2": 141.28, "r_x3": 410.19, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 391.37, "t": 85.73, "r": 432.67, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 90.69, "r_x1": 432.67, "r_y1": 90.69, "r_x2": 432.67, "r_y2": 85.73, "r_x3": 391.37, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 435.61, "t": 86.26, "r": 445.62, "b": 91.22, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61, "r_y0": 91.22, "r_x1": 445.62, "r_y1": 91.22, "r_x2": 445.62, "r_y2": 86.26, "r_x3": 435.61, "r_y3": 86.26, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 113.95, "t": 141.29, "r": 136.2, "b": 146.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.95, "r_y0": 146.25, "r_x1": 136.2, "r_y1": 146.25, "r_x2": 136.2, "r_y2": 141.29, "r_x3": 113.95, "r_y3": 141.29, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 116.92, "t": 94.82, "r": 127.05, "b": 99.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.92, "r_y0": 99.78, "r_x1": 127.05, "r_y1": 99.78, "r_x2": 127.05, "r_y2": 94.82, "r_x3": 116.92, "r_y3": 94.82, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 113.31, "t": 100.94, "r": 127.05, "b": 105.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.31, "r_y0": 105.9, "r_x1": 127.05, "r_y1": 105.9, "r_x2": 127.05, "r_y2": 100.94, "r_x3": 113.31, "r_y3": 100.94, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 112.94, "t": 107.06, "r": 127.06, "b": 112.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94, "r_y0": 112.02, "r_x1": 127.06, "r_y1": 112.02, "r_x2": 127.06, "r_y2": 107.06, "r_x3": 112.94, "r_y3": 107.06, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 113.23, "t": 122.62, "r": 126.97, "b": 127.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.23, "r_y0": 127.57, "r_x1": 126.97, "r_y1": 127.57, "r_x2": 126.97, "r_y2": 122.62, "r_x3": 113.23, "r_y3": 122.62, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 112.85, "t": 128.74, "r": 126.97, "b": 133.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85, "r_y0": 133.69, "r_x1": 126.97, "r_y1": 133.69, "r_x2": 126.97, "r_y2": 128.74, "r_x3": 112.85, "r_y3": 128.74, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 138.58, "t": 141.44, "r": 156.04, "b": 146.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.58, "r_y0": 146.39, "r_x1": 156.04, "r_y1": 146.39, "r_x2": 156.04, "r_y2": 141.44, "r_x3": 138.58, "r_y3": 141.44, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 122.03, "t": 86.27, "r": 151.04, "b": 91.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03, "r_y0": 91.23, "r_x1": 151.04, "r_y1": 91.23, "r_x2": 151.04, "r_y2": 86.27, "r_x3": 122.03, "r_y3": 86.27, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 311.65, "t": 86.55, "r": 321.67, "b": 91.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65, "r_y0": 91.51, "r_x1": 321.67, "r_y1": 91.51, "r_x2": 321.67, "r_y2": 86.55, "r_x3": 311.65, "r_y3": 86.55, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 287.89, "t": 141.71, "r": 310.15, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89, "r_y0": 146.67, "r_x1": 310.15, "r_y1": 146.67, "r_x2": 310.15, "r_y2": 141.71, "r_x3": 287.89, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.24, "t": 93.08, "r": 299.37, "b": 98.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.24, "r_y0": 98.04, "r_x1": 299.37, "r_y1": 98.04, "r_x2": 299.37, "r_y2": 93.08, "r_x3": 289.24, "r_y3": 93.08, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 285.64, "t": 99.2, "r": 299.37, "b": 104.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 104.16, "r_x1": 299.37, "r_y1": 104.16, "r_x2": 299.37, "r_y2": 99.2, "r_x3": 285.64, "r_y3": 99.2, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 285.26, "t": 105.32, "r": 299.38, "b": 110.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26, "r_y0": 110.28, "r_x1": 299.38, "r_y1": 110.28, "r_x2": 299.38, "r_y2": 105.32, "r_x3": 285.26, "r_y3": 105.32, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 285.43, "t": 120.39, "r": 299.17, "b": 125.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43, "r_y0": 125.35, "r_x1": 299.17, "r_y1": 125.35, "r_x2": 299.17, "r_y2": 120.39, "r_x3": 285.43, "r_y3": 120.39, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 285.06, "t": 126.51, "r": 299.17, "b": 131.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.06, "r_y0": 131.47, "r_x1": 299.17, "r_y1": 131.47, "r_x2": 299.17, "r_y2": 126.51, "r_x3": 285.06, "r_y3": 126.51, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 311.35, "t": 141.71, "r": 328.81, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.35, "r_y0": 146.67, "r_x1": 328.81, "r_y1": 146.67, "r_x2": 328.81, "r_y2": 141.71, "r_x3": 311.35, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 299.58, "t": 86.69, "r": 309.6, "b": 91.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58, "r_y0": 91.65, "r_x1": 309.6, "r_y1": 91.65, "r_x2": 309.6, "r_y2": 86.69, "r_x3": 299.58, "r_y3": 86.69, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 466.04, "t": 141.67, "r": 483.5, "b": 146.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04, "r_y0": 146.63, "r_x1": 483.5, "r_y1": 146.63, "r_x2": 483.5, "r_y2": 141.67, "r_x3": 466.04, "r_y3": 141.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 459.02, "t": 93.76, "r": 469.16, "b": 98.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02, "r_y0": 98.72, "r_x1": 469.16, "r_y1": 98.72, "r_x2": 469.16, "r_y2": 93.76, "r_x3": 459.02, "r_y3": 93.76, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 455.42, "t": 99.88, "r": 469.16, "b": 104.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.42, "r_y0": 104.84, "r_x1": 469.16, "r_y1": 104.84, "r_x2": 469.16, "r_y2": 99.88, "r_x3": 455.42, "r_y3": 99.88, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 455.05, "t": 106.0, "r": 469.16, "b": 110.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.05, "r_y0": 110.96, "r_x1": 469.16, "r_y1": 110.96, "r_x2": 469.16, "r_y2": 106.0, "r_x3": 455.05, "r_y3": 106.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 467.39, "t": 85.57, "r": 480.65, "b": 90.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39, "r_y0": 90.53, "r_x1": 480.65, "r_y1": 90.53, "r_x2": 480.65, "r_y2": 85.57, "r_x3": 467.39, "r_y3": 85.57, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 160.38, "t": 141.58, "r": 182.63, "b": 146.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.38, "r_y0": 146.54, "r_x1": 182.63, "r_y1": 146.54, "r_x2": 182.63, "r_y2": 141.58, "r_x3": 160.38, "r_y3": 141.58, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 153.74, "t": 94.86, "r": 173.33, "b": 99.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74, "r_y0": 99.82, "r_x1": 173.33, "r_y1": 99.82, "r_x2": 173.33, "r_y2": 94.86, "r_x3": 153.74, "r_y3": 94.86, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 154.51, "t": 100.98, "r": 173.32, "b": 105.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 105.94, "r_x1": 173.32, "r_y1": 105.94, "r_x2": 173.32, "r_y2": 100.98, "r_x3": 154.51, "r_y3": 100.98, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 155.27, "t": 107.1, "r": 173.33, "b": 112.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27, "r_y0": 112.06, "r_x1": 173.33, "r_y1": 112.06, "r_x2": 173.33, "r_y2": 107.1, "r_x3": 155.27, "r_y3": 107.1, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.41, "t": 107.23, "r": 346.0, "b": 112.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41, "r_y0": 112.19, "r_x1": 346.0, "r_y1": 112.19, "r_x2": 346.0, "r_y2": 107.23, "r_x3": 326.41, "r_y3": 107.23, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 327.18, "t": 113.35, "r": 345.99, "b": 118.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.18, "r_y0": 118.31, "r_x1": 345.99, "r_y1": 118.31, "r_x2": 345.99, "r_y2": 113.35, "r_x3": 327.18, "r_y3": 113.35, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 327.94, "t": 119.47, "r": 346.0, "b": 124.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94, "r_y0": 124.43, "r_x1": 346.0, "r_y1": 124.43, "r_x2": 346.0, "r_y2": 119.47, "r_x3": 327.94, "r_y3": 119.47, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 488.99, "t": 104.15, "r": 508.76, "b": 109.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.99, "r_y0": 109.11, "r_x1": 508.76, "r_y1": 109.11, "r_x2": 508.76, "r_y2": 104.15, "r_x3": 488.99, "r_y3": 104.15, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 490.19, "t": 110.27, "r": 508.76, "b": 115.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.19, "r_y0": 115.23, "r_x1": 508.76, "r_y1": 115.23, "r_x2": 508.76, "r_y2": 110.27, "r_x3": 490.19, "r_y3": 110.27, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 489.72, "t": 116.39, "r": 508.77, "b": 121.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72, "r_y0": 121.35, "r_x1": 508.77, "r_y1": 121.35, "r_x2": 508.77, "r_y2": 116.39, "r_x3": 489.72, "r_y3": 116.39, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 490.71, "t": 122.51, "r": 508.77, "b": 127.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71, "r_y0": 127.47, "r_x1": 508.77, "r_y1": 127.47, "r_x2": 508.77, "r_y2": 122.51, "r_x3": 490.71, "r_y3": 122.51, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 185.38, "t": 141.71, "r": 202.84, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.38, "r_y0": 146.67, "r_x1": 202.84, "r_y1": 146.67, "r_x2": 202.84, "r_y2": 141.71, "r_x3": 185.38, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 168.5, "t": 86.14, "r": 197.53, "b": 91.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.5, "r_y0": 91.09, "r_x1": 197.53, "r_y1": 91.09, "r_x2": 197.53, "r_y2": 86.14, "r_x3": 168.5, "r_y3": 86.14, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 357.38, "t": 86.0, "r": 367.4, "b": 90.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.38, "r_y0": 90.95, "r_x1": 367.4, "r_y1": 90.95, "r_x2": 367.4, "r_y2": 86.0, "r_x3": 357.38, "r_y3": 86.0, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 333.73, "t": 141.62, "r": 374.93, "b": 146.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73, "r_y0": 146.58, "r_x1": 374.93, "r_y1": 146.58, "r_x2": 374.93, "r_y2": 141.62, "r_x3": 333.73, "r_y3": 141.62, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 345.69, "t": 86.06, "r": 355.71, "b": 91.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69, "r_y0": 91.01, "r_x1": 355.71, "r_y1": 91.01, "r_x2": 355.71, "r_y2": 86.06, "r_x3": 345.69, "r_y3": 86.06, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 508.54, "t": 141.38, "r": 526.01, "b": 146.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54, "r_y0": 146.33, "r_x1": 526.01, "r_y1": 146.33, "r_x2": 526.01, "r_y2": 141.38, "r_x3": 508.54, "r_y3": 141.38, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 510.45, "t": 86.09, "r": 523.71, "b": 91.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.45, "r_y0": 91.05, "r_x1": 523.71, "r_y1": 91.05, "r_x2": 523.71, "r_y2": 86.09, "r_x3": 510.45, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 50.11, "t": 165.5, "r": 545.11, "b": 186.36, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 174.41, "r_x1": 545.11, "r_y1": 174.41, "r_x2": 545.11, "r_y2": 165.5, "r_x3": 50.11, "r_y3": 165.5, "coord_origin": "TOPLEFT" }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 186.36, "r_x1": 513.52, "r_y1": 186.36, "r_x2": 513.52, "r_y2": 177.46, "r_x3": 50.11, "r_y3": 177.46, "coord_origin": "TOPLEFT" }, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity." }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 61.57, "t": 210.93, "r": 286.37, "b": 231.79, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 219.84, "r_x1": 71.15, "r_y1": 219.84, "r_x2": 71.15, "r_y2": 210.93, "r_x3": 61.57, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.54, "r_y0": 219.84, "r_x1": 286.37, "r_y1": 219.84, "r_x2": 286.37, "r_y2": 210.93, "r_x3": 73.54, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 231.79, "r_x1": 87.47, "r_y1": 231.79, "r_x2": 87.47, "r_y2": 222.89, "r_x3": 70.04, "r_y3": 222.89, "coord_origin": "TOPLEFT" }, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 TableFormer output does not include the table cell content." }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 61.57, "t": 244.07, "r": 286.37, "b": 264.93, "coord_origin": "TOPLEFT" }, "confidence": 0.963, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 252.98, "r_x1": 71.35, "r_y1": 252.98, "r_x2": 71.35, "r_y2": 244.07, "r_x3": 61.57, "r_y3": 244.07, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.79, "r_y0": 252.98, "r_x1": 286.37, "r_y1": 252.98, "r_x2": 286.37, "r_y2": 244.07, "r_x3": 73.79, "r_y3": 244.07, "coord_origin": "TOPLEFT" }, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 264.93, "r_x1": 150.42, "r_y1": 264.93, "r_x2": 150.42, "r_y2": 256.03, "r_x3": 70.04, "r_y3": 256.03, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 279.2, "r": 286.37, "b": 395.71, "coord_origin": "TOPLEFT" }, "confidence": 0.977, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 288.11, "r_x1": 286.36, "r_y1": 288.11, "r_x2": 286.36, "r_y2": 279.2, "r_x3": 62.07, "r_y3": 279.2, "coord_origin": "TOPLEFT" }, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.06, "r_x1": 286.37, "r_y1": 300.06, "r_x2": 286.37, "r_y2": 291.16, "r_x3": 50.11, "r_y3": 291.16, "coord_origin": "TOPLEFT" }, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.02, "r_x1": 286.37, "r_y1": 312.02, "r_x2": 286.37, "r_y2": 303.11, "r_x3": 50.11, "r_y3": 303.11, "coord_origin": "TOPLEFT" }, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 323.97, "r_x1": 286.37, "r_y1": 323.97, "r_x2": 286.37, "r_y2": 315.07, "r_x3": 50.11, "r_y3": 315.07, "coord_origin": "TOPLEFT" }, "text": "More specifically, PDF documents can be seen as a se-", "orig": "More specifically, PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 335.93, "r_x1": 286.37, "r_y1": 335.93, "r_x2": 286.37, "r_y2": 327.02, "r_x3": 50.11, "r_y3": 327.02, "coord_origin": "TOPLEFT" }, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 347.89, "r_x1": 286.37, "r_y1": 347.89, "r_x2": 286.37, "r_y2": 338.98, "r_x3": 50.11, "r_y3": 338.98, "coord_origin": "TOPLEFT" }, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.84, "r_x1": 286.37, "r_y1": 359.84, "r_x2": 286.37, "r_y2": 350.93, "r_x3": 50.11, "r_y3": 350.93, "coord_origin": "TOPLEFT" }, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.8, "r_x1": 286.37, "r_y1": 371.8, "r_x2": 286.37, "r_y2": 362.89, "r_x3": 50.11, "r_y3": 362.89, "coord_origin": "TOPLEFT" }, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 383.75, "r_x1": 286.37, "r_y1": 383.75, "r_x2": 286.37, "r_y2": 374.84, "r_x3": 50.11, "r_y3": 374.84, "coord_origin": "TOPLEFT" }, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 395.71, "r_x1": 154.56, "r_y1": 395.71, "r_x2": 154.56, "r_y2": 386.8, "r_x3": 50.11, "r_y3": 386.8, "coord_origin": "TOPLEFT" }, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes." }, { "label": "text", "id": 11, "page_no": 11, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 399.07, "r": 286.36, "b": 419.93, "coord_origin": "TOPLEFT" }, "confidence": 0.935, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 407.98, "r_x1": 286.36, "r_y1": 407.98, "r_x2": 286.36, "r_y2": 399.07, "r_x3": 62.07, "r_y3": 399.07, "coord_origin": "TOPLEFT" }, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 419.93, "r_x1": 95.49, "r_y1": 419.93, "r_x2": 95.49, "r_y2": 411.03, "r_x3": 50.11, "r_y3": 411.03, "coord_origin": "TOPLEFT" }, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Here is a step-by-step description of the prediction postprocessing:" }, { "label": "list_item", "id": 20, "page_no": 11, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 50.11, "t": 423.3, "r": 286.37, "b": 456.11, "coord_origin": "TOPLEFT" }, "confidence": 0.828, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 432.2, "r_x1": 69.37, "r_y1": 432.2, "r_x2": 69.37, "r_y2": 423.3, "r_x3": 62.07, "r_y3": 423.3, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.81, "r_y0": 432.2, "r_x1": 286.37, "r_y1": 432.2, "r_x2": 286.37, "r_y2": 423.3, "r_x3": 71.81, "r_y3": 423.3, "coord_origin": "TOPLEFT" }, "text": "Get the minimal grid dimensions - number of rows and", "orig": "Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 444.16, "r_x1": 286.37, "r_y1": 444.16, "r_x2": 286.37, "r_y2": 435.25, "r_x3": 50.11, "r_y3": 435.25, "coord_origin": "TOPLEFT" }, "text": "columns for the predicted table structure. This represents", "orig": "columns for the predicted table structure. This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 456.11, "r_x1": 274.51, "r_y1": 456.11, "r_x2": 274.51, "r_y2": 447.21, "r_x3": 50.11, "r_y3": 447.21, "coord_origin": "TOPLEFT" }, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure." }, { "label": "list_item", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 50.11, "t": 459.48, "r": 286.37, "b": 504.25, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 468.38, "r_x1": 69.54, "r_y1": 468.38, "r_x2": 69.54, "r_y2": 459.48, "r_x3": 62.07, "r_y3": 459.48, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 77.43, "r_y0": 468.38, "r_x1": 286.36, "r_y1": 468.38, "r_x2": 286.36, "r_y2": 459.48, "r_x3": 77.43, "r_y3": 459.48, "coord_origin": "TOPLEFT" }, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 480.34, "r_x1": 286.37, "r_y1": 480.34, "r_x2": 286.37, "r_y2": 471.43, "r_x3": 50.11, "r_y3": 471.43, "coord_origin": "TOPLEFT" }, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 492.29, "r_x1": 286.37, "r_y1": 492.29, "r_x2": 286.37, "r_y2": 483.39, "r_x3": 50.11, "r_y3": 483.39, "coord_origin": "TOPLEFT" }, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 504.25, "r_x1": 110.7, "r_y1": 504.25, "r_x2": 110.7, "r_y2": 495.34, "r_x3": 50.11, "r_y3": 495.34, "coord_origin": "TOPLEFT" }, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches." }, { "label": "list_item", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 50.11, "t": 507.61, "r": 286.36, "b": 528.47, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 516.52, "r_x1": 69.86, "r_y1": 516.52, "r_x2": 69.86, "r_y2": 507.61, "r_x3": 62.07, "r_y3": 507.61, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.46, "r_y0": 516.52, "r_x1": 286.36, "r_y1": 516.52, "r_x2": 286.36, "r_y2": 507.61, "r_x3": 72.46, "r_y3": 507.61, "coord_origin": "TOPLEFT" }, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 528.47, "r_x1": 226.07, "r_y1": 528.47, "r_x2": 226.07, "r_y2": 519.57, "r_x3": 50.11, "r_y3": 519.57, "coord_origin": "TOPLEFT" }, "text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Use a carefully selected IOU threshold to designate the matches as \"good\" ones and \"bad\" ones." }, { "label": "list_item", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 50.11, "t": 531.84, "r": 286.37, "b": 564.65, "coord_origin": "TOPLEFT" }, "confidence": 0.949, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 540.74, "r_x1": 286.36, "r_y1": 540.74, "r_x2": 286.36, "r_y2": 531.84, "r_x3": 62.07, "r_y3": 531.84, "coord_origin": "TOPLEFT" }, "text": "3.a. If all IOU scores in a column are below the thresh-", "orig": "3.a. If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 552.7, "r_x1": 286.37, "r_y1": 552.7, "r_x2": 286.37, "r_y2": 543.79, "r_x3": 50.11, "r_y3": 543.79, "coord_origin": "TOPLEFT" }, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 564.65, "r_x1": 114.03, "r_y1": 564.65, "r_x2": 114.03, "r_y2": 555.75, "r_x3": 50.11, "r_y3": 555.75, "coord_origin": "TOPLEFT" }, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column." }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 568.02, "r": 286.37, "b": 600.83, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 576.92, "r_x1": 69.54, "r_y1": 576.92, "r_x2": 69.54, "r_y2": 568.02, "r_x3": 62.07, "r_y3": 568.02, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.73, "r_y0": 576.92, "r_x1": 286.37, "r_y1": 576.92, "r_x2": 286.37, "r_y2": 568.02, "r_x3": 76.73, "r_y3": 568.02, "coord_origin": "TOPLEFT" }, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 588.88, "r_x1": 286.37, "r_y1": 588.88, "r_x2": 286.37, "r_y2": 579.97, "r_x3": 50.11, "r_y3": 579.97, "coord_origin": "TOPLEFT" }, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 600.83, "r_x1": 278.7, "r_y1": 600.83, "r_x2": 278.7, "r_y2": 591.93, "r_x3": 50.11, "r_y3": 591.93, "coord_origin": "TOPLEFT" }, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:" }, { "label": "formula", "id": 12, "page_no": 11, "cluster": { "id": 12, "label": "formula", "bbox": { "l": 110.7, "t": 623.44, "r": 286.36, "b": 654.11, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.03, "r_y0": 632.84, "r_x1": 157.95, "r_y1": 632.84, "r_x2": 157.95, "r_y2": 623.99, "r_x3": 112.03, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.72, "r_y0": 632.84, "r_x1": 203.5, "r_y1": 632.84, "r_x2": 203.5, "r_y2": 623.99, "r_x3": 160.72, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58, "r_y0": 640.18, "r_x1": 189.15, "r_y1": 640.18, "r_x2": 189.15, "r_y2": 633.98, "r_x3": 185.58, "r_y3": 633.98, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 203.5, "r_y0": 632.84, "r_x1": 208.48, "r_y1": 632.84, "r_x2": 208.48, "r_y2": 623.44, "r_x3": 203.5, "r_y3": 623.44, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.48, "r_y0": 632.84, "r_x1": 220.29, "r_y1": 632.84, "r_x2": 220.29, "r_y2": 623.99, "r_x3": 208.48, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.79, "r_y0": 632.84, "r_x1": 225.77, "r_y1": 632.84, "r_x2": 225.77, "r_y2": 623.44, "r_x3": 220.79, "r_y3": 623.44, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.7, "r_y0": 654.11, "r_x1": 122.51, "r_y1": 654.11, "r_x2": 122.51, "r_y2": 645.26, "r_x3": 110.7, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.78, "r_y0": 654.11, "r_x1": 133.53, "r_y1": 654.11, "r_x2": 133.53, "r_y2": 645.26, "r_x3": 125.78, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 136.29, "r_y0": 654.11, "r_x1": 156.0, "r_y1": 654.11, "r_x2": 156.0, "r_y2": 645.26, "r_x3": 136.29, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "max", "orig": "max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.0, "r_y0": 654.11, "r_x1": 160.98, "r_y1": 654.11, "r_x2": 160.98, "r_y2": 644.7, "r_x3": 156.0, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.98, "r_y0": 654.11, "r_x1": 170.24, "r_y1": 654.11, "r_x2": 170.24, "r_y2": 645.26, "r_x3": 160.98, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.74, "r_y0": 654.11, "r_x1": 185.68, "r_y1": 654.11, "r_x2": 185.68, "r_y2": 644.7, "r_x3": 170.74, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "} \u2212", "orig": "} \u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.89, "r_y0": 654.11, "r_x1": 206.05, "r_y1": 654.11, "r_x2": 206.05, "r_y2": 645.26, "r_x3": 187.89, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "min", "orig": "min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.05, "r_y0": 654.11, "r_x1": 211.04, "r_y1": 654.11, "r_x2": 211.04, "r_y2": 644.7, "r_x3": 206.05, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.03, "r_y0": 654.11, "r_x1": 220.29, "r_y1": 654.11, "r_x2": 220.29, "r_y2": 645.26, "r_x3": 211.03, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.79, "r_y0": 654.11, "r_x1": 225.77, "r_y1": 654.11, "r_x2": 225.77, "r_y2": 644.7, "r_x3": 220.79, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 643.79, "r_x1": 286.36, "r_y1": 643.79, "r_x2": 286.36, "r_y2": 634.89, "r_x3": 274.75, "r_y3": 634.89, "coord_origin": "TOPLEFT" }, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "alignment = arg min c { D$_{c}$ } D$_{c}$ = max { x$_{c}$ } \u2212 min { x$_{c}$ } (4)" }, { "label": "text", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 667.35, "r": 286.36, "b": 688.93, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 676.97, "r_x1": 74.45, "r_y1": 676.97, "r_x2": 74.45, "r_y2": 668.07, "r_x3": 50.11, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.34, "r_y0": 676.75, "r_x1": 82.65, "r_y1": 676.75, "r_x2": 82.65, "r_y2": 667.91, "r_x3": 78.34, "r_y3": 667.91, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.53, "r_y0": 676.97, "r_x1": 123.63, "r_y1": 676.97, "r_x2": 123.63, "r_y2": 668.07, "r_x3": 86.53, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "is one of", "orig": "is one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 127.52, "r_y0": 676.75, "r_x1": 132.5, "r_y1": 676.75, "r_x2": 132.5, "r_y2": 667.35, "r_x3": 127.52, "r_y3": 667.35, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.5, "r_y0": 676.97, "r_x1": 210.7, "r_y1": 676.97, "r_x2": 210.7, "r_y2": 668.07, "r_x3": 132.5, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "left, centroid, right", "orig": "left, centroid, right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.7, "r_y0": 676.75, "r_x1": 215.68, "r_y1": 676.75, "r_x2": 215.68, "r_y2": 667.35, "r_x3": 210.7, "r_y3": 667.35, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.56, "r_y0": 676.97, "r_x1": 233.95, "r_y1": 676.97, "r_x2": 233.95, "r_y2": 668.07, "r_x3": 219.56, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 237.83, "r_y0": 676.75, "r_x1": 247.09, "r_y1": 676.75, "r_x2": 247.09, "r_y2": 667.91, "r_x3": 237.83, "r_y3": 667.91, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.47, "r_y0": 676.97, "r_x1": 286.36, "r_y1": 676.97, "r_x2": 286.36, "r_y2": 668.07, "r_x3": 251.47, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "is the x-", "orig": "is the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 688.93, "r_x1": 205.89, "r_y1": 688.93, "r_x2": 205.89, "r_y2": 680.02, "r_x3": 50.11, "r_y3": 680.02, "coord_origin": "TOPLEFT" }, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where c is one of { left, centroid, right } and x$_{c}$ is the xcoordinate for the corresponding point." }, { "label": "list_item", "id": 13, "page_no": 11, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 692.29, "r": 286.36, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 701.2, "r_x1": 69.54, "r_y1": 701.2, "r_x2": 69.54, "r_y2": 692.29, "r_x3": 62.07, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.27, "r_y0": 701.2, "r_x1": 286.36, "r_y1": 701.2, "r_x2": 286.36, "r_y2": 692.29, "r_x3": 76.27, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 94.6, "r_y1": 713.15, "r_x2": 94.6, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.6, "r_y0": 712.93, "r_x1": 103.29, "r_y1": 712.93, "r_x2": 103.29, "r_y2": 704.09, "r_x3": 97.6, "r_y3": 704.09, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.29, "r_y0": 713.15, "r_x1": 286.36, "r_y1": 713.15, "r_x2": 286.36, "r_y2": 704.25, "r_x3": 103.29, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Use the alignment computed in step 4, to compute the median x -coordinate for all table columns and the me-" }, { "label": "text", "id": 16, "page_no": 11, "cluster": { "id": 16, "label": "text", "bbox": { "l": 308.86, "t": 210.93, "r": 545.12, "b": 255.7, "coord_origin": "TOPLEFT" }, "confidence": 0.894, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 219.84, "r_x1": 545.12, "r_y1": 219.84, "r_x2": 545.12, "r_y2": 210.93, "r_x3": 308.86, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "dian cell size for all table cells. The usage of median dur-", "orig": "dian cell size for all table cells. The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 231.79, "r_x1": 545.12, "r_y1": 231.79, "r_x2": 545.12, "r_y2": 222.89, "r_x3": 308.86, "r_y3": 222.89, "coord_origin": "TOPLEFT" }, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 243.75, "r_x1": 545.12, "r_y1": 243.75, "r_x2": 545.12, "r_y2": 234.84, "r_x3": 308.86, "r_y3": 234.84, "coord_origin": "TOPLEFT" }, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 255.7, "r_x1": 339.58, "r_y1": 255.7, "r_x2": 339.58, "r_y2": 246.8, "r_x3": 308.86, "r_y3": 246.8, "coord_origin": "TOPLEFT" }, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal." }, { "label": "list_item", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 259.1, "r": 545.11, "b": 279.96, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 268.01, "r_x1": 328.29, "r_y1": 268.01, "r_x2": 328.29, "r_y2": 259.1, "r_x3": 320.82, "r_y3": 259.1, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.88, "r_y0": 268.01, "r_x1": 545.11, "r_y1": 268.01, "r_x2": 545.11, "r_y2": 259.1, "r_x3": 334.88, "r_y3": 259.1, "coord_origin": "TOPLEFT" }, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 279.96, "r_x1": 338.19, "r_y1": 279.96, "r_x2": 338.19, "r_y2": 271.06, "r_x3": 308.86, "r_y3": 271.06, "coord_origin": "TOPLEFT" }, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.68, "r_y0": 279.74, "r_x1": 346.38, "r_y1": 279.74, "r_x2": 346.38, "r_y2": 270.9, "r_x3": 340.68, "r_y3": 270.9, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.38, "r_y0": 279.96, "r_x1": 453.72, "r_y1": 279.96, "r_x2": 453.72, "r_y2": 271.06, "r_x3": 346.38, "r_y3": 271.06, "coord_origin": "TOPLEFT" }, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes." }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 283.36, "r": 545.12, "b": 387.91, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 292.27, "r_x1": 328.39, "r_y1": 292.27, "r_x2": 328.39, "r_y2": 283.36, "r_x3": 320.82, "r_y3": 283.36, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.91, "r_y0": 292.27, "r_x1": 545.11, "r_y1": 292.27, "r_x2": 545.11, "r_y2": 283.36, "r_x3": 330.91, "r_y3": 283.36, "coord_origin": "TOPLEFT" }, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.22, "r_x1": 545.12, "r_y1": 304.22, "r_x2": 545.12, "r_y2": 295.32, "r_x3": 308.86, "r_y3": 295.32, "coord_origin": "TOPLEFT" }, "text": "corrected bounding boxes and PDF cells. This time use a", "orig": "corrected bounding boxes and PDF cells. This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.18, "r_x1": 545.12, "r_y1": 316.18, "r_x2": 545.12, "r_y2": 307.27, "r_x3": 308.86, "r_y3": 307.27, "coord_origin": "TOPLEFT" }, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 328.13, "r_x1": 545.12, "r_y1": 328.13, "r_x2": 545.12, "r_y2": 319.23, "r_x3": 308.86, "r_y3": 319.23, "coord_origin": "TOPLEFT" }, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 340.09, "r_x1": 397.19, "r_y1": 340.09, "r_x2": 397.19, "r_y2": 331.18, "r_x3": 308.86, "r_y3": 331.18, "coord_origin": "TOPLEFT" }, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.66, "r_y0": 340.09, "r_x1": 545.12, "r_y1": 340.09, "r_x2": 545.12, "r_y2": 331.18, "r_x3": 403.66, "r_y3": 331.18, "coord_origin": "TOPLEFT" }, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 352.05, "r_x1": 545.12, "r_y1": 352.05, "r_x2": 545.12, "r_y2": 343.14, "r_x3": 308.86, "r_y3": 343.14, "coord_origin": "TOPLEFT" }, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 364.0, "r_x1": 545.12, "r_y1": 364.0, "r_x2": 545.12, "r_y2": 355.09, "r_x3": 308.86, "r_y3": 355.09, "coord_origin": "TOPLEFT" }, "text": "is preferred. This covers the cases where the PDF cells are", "orig": "is preferred. This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 375.96, "r_x1": 545.12, "r_y1": 375.96, "r_x2": 545.12, "r_y2": 367.05, "r_x3": 308.86, "r_y3": 367.05, "coord_origin": "TOPLEFT" }, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 387.91, "r_x1": 329.61, "r_y1": 387.91, "r_x2": 329.61, "r_y2": 379.0, "r_x3": 308.86, "r_y3": 379.0, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells." }, { "label": "list_item", "id": 17, "page_no": 11, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 308.86, "t": 391.31, "r": 545.12, "b": 459.99, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 400.22, "r_x1": 328.55, "r_y1": 400.22, "r_x2": 328.55, "r_y2": 391.31, "r_x3": 320.82, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.13, "r_y0": 400.22, "r_x1": 545.12, "r_y1": 400.22, "r_x2": 545.12, "r_y2": 391.31, "r_x3": 331.13, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.17, "r_x1": 545.12, "r_y1": 412.17, "r_x2": 545.12, "r_y2": 403.27, "r_x3": 308.86, "r_y3": 403.27, "coord_origin": "TOPLEFT" }, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.13, "r_x1": 545.12, "r_y1": 424.13, "r_x2": 545.12, "r_y2": 415.22, "r_x3": 308.86, "r_y3": 415.22, "coord_origin": "TOPLEFT" }, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.08, "r_x1": 545.12, "r_y1": 436.08, "r_x2": 545.12, "r_y2": 427.18, "r_x3": 308.86, "r_y3": 427.18, "coord_origin": "TOPLEFT" }, "text": "columns pointing to the same PDF column. In such case", "orig": "columns pointing to the same PDF column. In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.04, "r_x1": 545.12, "r_y1": 448.04, "r_x2": 545.12, "r_y2": 439.13, "r_x3": 308.86, "r_y3": 439.13, "coord_origin": "TOPLEFT" }, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 459.99, "r_x1": 426.18, "r_y1": 459.99, "r_x2": 426.18, "r_y2": 451.09, "r_x3": 308.86, "r_y3": 451.09, "coord_origin": "TOPLEFT" }, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score." }, { "label": "list_item", "id": 15, "page_no": 11, "cluster": { "id": 15, "label": "list_item", "bbox": { "l": 308.86, "t": 463.39, "r": 545.12, "b": 567.94, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 472.3, "r_x1": 328.67, "r_y1": 472.3, "r_x2": 328.67, "r_y2": 463.39, "r_x3": 320.82, "r_y3": 463.39, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.29, "r_y0": 472.3, "r_x1": 545.11, "r_y1": 472.3, "r_x2": 545.11, "r_y2": 463.39, "r_x3": 331.29, "r_y3": 463.39, "coord_origin": "TOPLEFT" }, "text": "Pick up the remaining orphan cells. There could be", "orig": "Pick up the remaining orphan cells. There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 484.25, "r_x1": 545.12, "r_y1": 484.25, "r_x2": 545.12, "r_y2": 475.35, "r_x3": 308.86, "r_y3": 475.35, "coord_origin": "TOPLEFT" }, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 496.21, "r_x1": 545.12, "r_y1": 496.21, "r_x2": 545.12, "r_y2": 487.3, "r_x3": 308.86, "r_y3": 487.3, "coord_origin": "TOPLEFT" }, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 508.16, "r_x1": 381.9, "r_y1": 508.16, "r_x2": 381.9, "r_y2": 499.26, "r_x3": 308.86, "r_y3": 499.26, "coord_origin": "TOPLEFT" }, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 508.16, "r_x1": 545.12, "r_y1": 508.16, "r_x2": 545.12, "r_y2": 499.26, "r_x3": 388.7, "r_y3": 499.26, "coord_origin": "TOPLEFT" }, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 520.12, "r_x1": 545.12, "r_y1": 520.12, "r_x2": 545.12, "r_y2": 511.21, "r_x3": 308.86, "r_y3": 511.21, "coord_origin": "TOPLEFT" }, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 532.07, "r_x1": 545.12, "r_y1": 532.07, "r_x2": 545.12, "r_y2": 523.17, "r_x3": 308.86, "r_y3": 523.17, "coord_origin": "TOPLEFT" }, "text": "bounding box on the geometry of the grid. This mapping", "orig": "bounding box on the geometry of the grid. This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 544.03, "r_x1": 545.11, "r_y1": 544.03, "r_x2": 545.11, "r_y2": 535.12, "r_x3": 308.86, "r_y3": 535.12, "coord_origin": "TOPLEFT" }, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 555.98, "r_x1": 545.12, "r_y1": 555.98, "r_x2": 545.12, "r_y2": 547.08, "r_x3": 308.86, "r_y3": 547.08, "coord_origin": "TOPLEFT" }, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 567.94, "r_x1": 442.22, "r_y1": 567.94, "r_x2": 442.22, "r_y2": 559.03, "r_x3": 308.86, "r_y3": 559.03, "coord_origin": "TOPLEFT" }, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan." }, { "label": "text", "id": 19, "page_no": 11, "cluster": { "id": 19, "label": "text", "bbox": { "l": 308.86, "t": 571.34, "r": 545.12, "b": 604.15, "coord_origin": "TOPLEFT" }, "confidence": 0.846, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 580.24, "r_x1": 545.11, "r_y1": 580.24, "r_x2": 545.11, "r_y2": 571.34, "r_x3": 320.82, "r_y3": 571.34, "coord_origin": "TOPLEFT" }, "text": "9a. Compute the top and bottom boundary of the hori-", "orig": "9a. Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 592.2, "r_x1": 471.64, "r_y1": 592.2, "r_x2": 471.64, "r_y2": 583.29, "r_x3": 308.86, "r_y3": 583.29, "coord_origin": "TOPLEFT" }, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.83, "r_y0": 591.98, "r_x1": 479.72, "r_y1": 591.98, "r_x2": 479.72, "r_y2": 583.13, "r_x3": 474.83, "r_y3": 583.13, "coord_origin": "TOPLEFT" }, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.27, "r_y0": 592.2, "r_x1": 545.12, "r_y1": 592.2, "r_x2": 545.12, "r_y2": 583.29, "r_x3": 483.27, "r_y3": 583.29, "coord_origin": "TOPLEFT" }, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 604.15, "r_x1": 329.91, "r_y1": 604.15, "r_x2": 329.91, "r_y2": 595.25, "r_x3": 308.86, "r_y3": 595.25, "coord_origin": "TOPLEFT" }, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)." }, { "label": "list_item", "id": 21, "page_no": 11, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 308.86, "t": 607.55, "r": 545.12, "b": 628.42, "coord_origin": "TOPLEFT" }, "confidence": 0.772, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 616.46, "r_x1": 332.87, "r_y1": 616.46, "r_x2": 332.87, "r_y2": 607.55, "r_x3": 320.82, "r_y3": 607.55, "coord_origin": "TOPLEFT" }, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93, "r_y0": 616.46, "r_x1": 545.12, "r_y1": 616.46, "r_x2": 545.12, "r_y2": 607.55, "r_x3": 339.93, "r_y3": 607.55, "coord_origin": "TOPLEFT" }, "text": "Intersect the orphan\u2019s bounding box with the row", "orig": "Intersect the orphan\u2019s bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 628.42, "r_x1": 495.29, "r_y1": 628.42, "r_x2": 495.29, "r_y2": 619.51, "r_x3": 308.86, "r_y3": 619.51, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row." }, { "label": "list_item", "id": 18, "page_no": 11, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 308.86, "t": 631.81, "r": 545.12, "b": 664.63, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 640.72, "r_x1": 545.12, "r_y1": 640.72, "r_x2": 545.12, "r_y2": 631.81, "r_x3": 320.82, "r_y3": 631.81, "coord_origin": "TOPLEFT" }, "text": "9c. Compute the left and right boundary of the vertical", "orig": "9c. Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 652.68, "r_x1": 455.28, "r_y1": 652.68, "r_x2": 455.28, "r_y2": 643.77, "r_x3": 308.86, "r_y3": 643.77, "coord_origin": "TOPLEFT" }, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 457.78, "r_y0": 652.46, "r_x1": 463.47, "r_y1": 652.46, "r_x2": 463.47, "r_y2": 643.61, "r_x3": 457.78, "r_y3": 643.61, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.97, "r_y0": 652.68, "r_x1": 545.11, "r_y1": 652.68, "r_x2": 545.11, "r_y2": 643.77, "r_x3": 465.97, "r_y3": 643.77, "coord_origin": "TOPLEFT" }, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 664.63, "r_x1": 332.38, "r_y1": 664.63, "r_x2": 332.38, "r_y2": 655.72, "r_x3": 308.86, "r_y3": 655.72, "coord_origin": "TOPLEFT" }, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)." }, { "label": "list_item", "id": 22, "page_no": 11, "cluster": { "id": 22, "label": "list_item", "bbox": { "l": 308.86, "t": 668.03, "r": 545.11, "b": 688.89, "coord_origin": "TOPLEFT" }, "confidence": 0.759, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 676.94, "r_x1": 545.11, "r_y1": 676.94, "r_x2": 545.11, "r_y2": 668.03, "r_x3": 320.82, "r_y3": 668.03, "coord_origin": "TOPLEFT" }, "text": "9d. Intersect the orphan\u2019s bounding box with the column", "orig": "9d. Intersect the orphan\u2019s bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 688.89, "r_x1": 510.58, "r_y1": 688.89, "r_x2": 510.58, "r_y2": 679.99, "r_x3": 308.86, "r_y3": 679.99, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column." }, { "label": "list_item", "id": 25, "page_no": 11, "cluster": { "id": 25, "label": "list_item", "bbox": { "l": 308.86, "t": 692.29, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.697, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 320.82, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-" }, { "label": "page_footer", "id": 14, "page_no": 11, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" } ], "body": [ { "label": "picture", "id": 30, "page_no": 11, "cluster": { "id": 30, "label": "picture", "bbox": { "l": 53.54, "t": 74.75, "r": 544.94, "b": 147.59, "coord_origin": "TOPLEFT" }, "confidence": 0.603, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39, "r_y0": 83.26, "r_x1": 151.95, "r_y1": 83.26, "r_x2": 151.95, "r_y2": 77.31, "r_x3": 119.39, "r_y3": 77.31, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.35, "r_y0": 81.14, "r_x1": 59.33, "r_y1": 81.14, "r_x2": 59.33, "r_y2": 75.19, "r_x3": 53.35, "r_y3": 75.19, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.58, "r_y0": 83.41, "r_x1": 319.83, "r_y1": 83.41, "r_x2": 319.83, "r_y2": 77.46, "r_x3": 289.58, "r_y3": 77.46, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37, "r_y0": 83.2, "r_x1": 481.76, "r_y1": 83.2, "r_x2": 481.76, "r_y2": 77.25, "r_x3": 448.37, "r_y3": 77.25, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.55, "r_y0": 146.23, "r_x1": 94.98, "r_y1": 146.23, "r_x2": 94.98, "r_y2": 141.28, "r_x3": 82.55, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.04, "r_y0": 106.06, "r_x1": 85.29, "r_y1": 106.06, "r_x2": 85.29, "r_y2": 101.1, "r_x3": 63.04, "r_y3": 101.1, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 129.35, "r_x1": 85.23, "r_y1": 129.35, "r_x2": 85.23, "r_y2": 124.4, "r_x3": 67.77, "r_y3": 124.4, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55, "r_y0": 107.5, "r_x1": 249.8, "r_y1": 107.5, "r_x2": 249.8, "r_y2": 102.54, "r_x3": 227.55, "r_y3": 102.54, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.2, "r_y0": 131.94, "r_x1": 249.66, "r_y1": 131.94, "r_x2": 249.66, "r_y2": 126.99, "r_x3": 232.2, "r_y3": 126.99, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.23, "r_y0": 119.0, "r_x1": 413.7, "r_y1": 119.0, "r_x2": 413.7, "r_y2": 114.05, "r_x3": 396.23, "r_y3": 114.05, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.38, "r_y0": 146.23, "r_x1": 105.08, "r_y1": 146.23, "r_x2": 105.08, "r_y2": 141.28, "r_x3": 97.38, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.94, "r_y0": 90.69, "r_x1": 76.15, "r_y1": 90.69, "r_x2": 76.15, "r_y2": 85.73, "r_x3": 60.94, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.3, "r_y0": 91.18, "r_x1": 106.99, "r_y1": 91.18, "r_x2": 106.99, "r_y2": 86.22, "r_x3": 82.3, "r_y3": 86.22, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.21, "r_y0": 146.56, "r_x1": 281.88, "r_y1": 146.56, "r_x2": 281.88, "r_y2": 141.61, "r_x3": 246.21, "r_y3": 141.61, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.7, "r_y0": 90.69, "r_x1": 241.91, "r_y1": 90.69, "r_x2": 241.91, "r_y2": 85.73, "r_x3": 226.7, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.94, "r_y0": 91.05, "r_x1": 282.49, "r_y1": 91.05, "r_x2": 282.49, "r_y2": 86.09, "r_x3": 249.94, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19, "r_y0": 146.23, "r_x1": 444.69, "r_y1": 146.23, "r_x2": 444.69, "r_y2": 141.28, "r_x3": 410.19, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 90.69, "r_x1": 432.67, "r_y1": 90.69, "r_x2": 432.67, "r_y2": 85.73, "r_x3": 391.37, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61, "r_y0": 91.22, "r_x1": 445.62, "r_y1": 91.22, "r_x2": 445.62, "r_y2": 86.26, "r_x3": 435.61, "r_y3": 86.26, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.95, "r_y0": 146.25, "r_x1": 136.2, "r_y1": 146.25, "r_x2": 136.2, "r_y2": 141.29, "r_x3": 113.95, "r_y3": 141.29, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.92, "r_y0": 99.78, "r_x1": 127.05, "r_y1": 99.78, "r_x2": 127.05, "r_y2": 94.82, "r_x3": 116.92, "r_y3": 94.82, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.31, "r_y0": 105.9, "r_x1": 127.05, "r_y1": 105.9, "r_x2": 127.05, "r_y2": 100.94, "r_x3": 113.31, "r_y3": 100.94, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94, "r_y0": 112.02, "r_x1": 127.06, "r_y1": 112.02, "r_x2": 127.06, "r_y2": 107.06, "r_x3": 112.94, "r_y3": 107.06, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.23, "r_y0": 127.57, "r_x1": 126.97, "r_y1": 127.57, "r_x2": 126.97, "r_y2": 122.62, "r_x3": 113.23, "r_y3": 122.62, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85, "r_y0": 133.69, "r_x1": 126.97, "r_y1": 133.69, "r_x2": 126.97, "r_y2": 128.74, "r_x3": 112.85, "r_y3": 128.74, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.58, "r_y0": 146.39, "r_x1": 156.04, "r_y1": 146.39, "r_x2": 156.04, "r_y2": 141.44, "r_x3": 138.58, "r_y3": 141.44, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03, "r_y0": 91.23, "r_x1": 151.04, "r_y1": 91.23, "r_x2": 151.04, "r_y2": 86.27, "r_x3": 122.03, "r_y3": 86.27, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65, "r_y0": 91.51, "r_x1": 321.67, "r_y1": 91.51, "r_x2": 321.67, "r_y2": 86.55, "r_x3": 311.65, "r_y3": 86.55, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89, "r_y0": 146.67, "r_x1": 310.15, "r_y1": 146.67, "r_x2": 310.15, "r_y2": 141.71, "r_x3": 287.89, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.24, "r_y0": 98.04, "r_x1": 299.37, "r_y1": 98.04, "r_x2": 299.37, "r_y2": 93.08, "r_x3": 289.24, "r_y3": 93.08, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 104.16, "r_x1": 299.37, "r_y1": 104.16, "r_x2": 299.37, "r_y2": 99.2, "r_x3": 285.64, "r_y3": 99.2, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26, "r_y0": 110.28, "r_x1": 299.38, "r_y1": 110.28, "r_x2": 299.38, "r_y2": 105.32, "r_x3": 285.26, "r_y3": 105.32, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43, "r_y0": 125.35, "r_x1": 299.17, "r_y1": 125.35, "r_x2": 299.17, "r_y2": 120.39, "r_x3": 285.43, "r_y3": 120.39, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.06, "r_y0": 131.47, "r_x1": 299.17, "r_y1": 131.47, "r_x2": 299.17, "r_y2": 126.51, "r_x3": 285.06, "r_y3": 126.51, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.35, "r_y0": 146.67, "r_x1": 328.81, "r_y1": 146.67, "r_x2": 328.81, "r_y2": 141.71, "r_x3": 311.35, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58, "r_y0": 91.65, "r_x1": 309.6, "r_y1": 91.65, "r_x2": 309.6, "r_y2": 86.69, "r_x3": 299.58, "r_y3": 86.69, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04, "r_y0": 146.63, "r_x1": 483.5, "r_y1": 146.63, "r_x2": 483.5, "r_y2": 141.67, "r_x3": 466.04, "r_y3": 141.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02, "r_y0": 98.72, "r_x1": 469.16, "r_y1": 98.72, "r_x2": 469.16, "r_y2": 93.76, "r_x3": 459.02, "r_y3": 93.76, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.42, "r_y0": 104.84, "r_x1": 469.16, "r_y1": 104.84, "r_x2": 469.16, "r_y2": 99.88, "r_x3": 455.42, "r_y3": 99.88, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.05, "r_y0": 110.96, "r_x1": 469.16, "r_y1": 110.96, "r_x2": 469.16, "r_y2": 106.0, "r_x3": 455.05, "r_y3": 106.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39, "r_y0": 90.53, "r_x1": 480.65, "r_y1": 90.53, "r_x2": 480.65, "r_y2": 85.57, "r_x3": 467.39, "r_y3": 85.57, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.38, "r_y0": 146.54, "r_x1": 182.63, "r_y1": 146.54, "r_x2": 182.63, "r_y2": 141.58, "r_x3": 160.38, "r_y3": 141.58, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74, "r_y0": 99.82, "r_x1": 173.33, "r_y1": 99.82, "r_x2": 173.33, "r_y2": 94.86, "r_x3": 153.74, "r_y3": 94.86, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 105.94, "r_x1": 173.32, "r_y1": 105.94, "r_x2": 173.32, "r_y2": 100.98, "r_x3": 154.51, "r_y3": 100.98, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27, "r_y0": 112.06, "r_x1": 173.33, "r_y1": 112.06, "r_x2": 173.33, "r_y2": 107.1, "r_x3": 155.27, "r_y3": 107.1, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41, "r_y0": 112.19, "r_x1": 346.0, "r_y1": 112.19, "r_x2": 346.0, "r_y2": 107.23, "r_x3": 326.41, "r_y3": 107.23, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.18, "r_y0": 118.31, "r_x1": 345.99, "r_y1": 118.31, "r_x2": 345.99, "r_y2": 113.35, "r_x3": 327.18, "r_y3": 113.35, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94, "r_y0": 124.43, "r_x1": 346.0, "r_y1": 124.43, "r_x2": 346.0, "r_y2": 119.47, "r_x3": 327.94, "r_y3": 119.47, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.99, "r_y0": 109.11, "r_x1": 508.76, "r_y1": 109.11, "r_x2": 508.76, "r_y2": 104.15, "r_x3": 488.99, "r_y3": 104.15, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.19, "r_y0": 115.23, "r_x1": 508.76, "r_y1": 115.23, "r_x2": 508.76, "r_y2": 110.27, "r_x3": 490.19, "r_y3": 110.27, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72, "r_y0": 121.35, "r_x1": 508.77, "r_y1": 121.35, "r_x2": 508.77, "r_y2": 116.39, "r_x3": 489.72, "r_y3": 116.39, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71, "r_y0": 127.47, "r_x1": 508.77, "r_y1": 127.47, "r_x2": 508.77, "r_y2": 122.51, "r_x3": 490.71, "r_y3": 122.51, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.38, "r_y0": 146.67, "r_x1": 202.84, "r_y1": 146.67, "r_x2": 202.84, "r_y2": 141.71, "r_x3": 185.38, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.5, "r_y0": 91.09, "r_x1": 197.53, "r_y1": 91.09, "r_x2": 197.53, "r_y2": 86.14, "r_x3": 168.5, "r_y3": 86.14, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.38, "r_y0": 90.95, "r_x1": 367.4, "r_y1": 90.95, "r_x2": 367.4, "r_y2": 86.0, "r_x3": 357.38, "r_y3": 86.0, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73, "r_y0": 146.58, "r_x1": 374.93, "r_y1": 146.58, "r_x2": 374.93, "r_y2": 141.62, "r_x3": 333.73, "r_y3": 141.62, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69, "r_y0": 91.01, "r_x1": 355.71, "r_y1": 91.01, "r_x2": 355.71, "r_y2": 86.06, "r_x3": 345.69, "r_y3": 86.06, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54, "r_y0": 146.33, "r_x1": 526.01, "r_y1": 146.33, "r_x2": 526.01, "r_y2": 141.38, "r_x3": 508.54, "r_y3": 141.38, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.45, "r_y0": 91.05, "r_x1": 523.71, "r_y1": 91.05, "r_x2": 523.71, "r_y2": 86.09, "r_x3": 510.45, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 46, "label": "text", "bbox": { "l": 119.39, "t": 77.31, "r": 151.95, "b": 83.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 119.39, "r_y0": 83.26, "r_x1": 151.95, "r_y1": 83.26, "r_x2": 151.95, "r_y2": 77.31, "r_x3": 119.39, "r_y3": 77.31, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 53.35, "t": 75.19, "r": 59.33, "b": 81.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 53.35, "r_y0": 81.14, "r_x1": 59.33, "r_y1": 81.14, "r_x2": 59.33, "r_y2": 75.19, "r_x3": 53.35, "r_y3": 75.19, "coord_origin": "TOPLEFT" }, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 289.58, "t": 77.46, "r": 319.83, "b": 83.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.58, "r_y0": 83.41, "r_x1": 319.83, "r_y1": 83.41, "r_x2": 319.83, "r_y2": 77.46, "r_x3": 289.58, "r_y3": 77.46, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 448.37, "t": 77.25, "r": 481.76, "b": 83.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.37, "r_y0": 83.2, "r_x1": 481.76, "r_y1": 83.2, "r_x2": 481.76, "r_y2": 77.25, "r_x3": 448.37, "r_y3": 77.25, "coord_origin": "TOPLEFT" }, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 82.55, "t": 141.28, "r": 94.98, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.55, "r_y0": 146.23, "r_x1": 94.98, "r_y1": 146.23, "r_x2": 94.98, "r_y2": 141.28, "r_x3": 82.55, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train", "orig": "Train", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 63.04, "t": 101.1, "r": 85.29, "b": 106.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.04, "r_y0": 106.06, "r_x1": 85.29, "r_y1": 106.06, "r_x2": 85.29, "r_y2": 101.1, "r_x3": 63.04, "r_y3": 101.1, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 67.77, "t": 124.4, "r": 85.23, "b": 129.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 67.77, "r_y0": 129.35, "r_x1": 85.23, "r_y1": 129.35, "r_x2": 85.23, "r_y2": 124.4, "r_x3": 67.77, "r_y3": 124.4, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 227.55, "t": 102.54, "r": 249.8, "b": 107.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.55, "r_y0": 107.5, "r_x1": 249.8, "r_y1": 107.5, "r_x2": 249.8, "r_y2": 102.54, "r_x3": 227.55, "r_y3": 102.54, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 232.2, "t": 126.99, "r": 249.66, "b": 131.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.2, "r_y0": 131.94, "r_x1": 249.66, "r_y1": 131.94, "r_x2": 249.66, "r_y2": 126.99, "r_x3": 232.2, "r_y3": 126.99, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 396.23, "t": 114.05, "r": 413.7, "b": 119.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.23, "r_y0": 119.0, "r_x1": 413.7, "r_y1": 119.0, "r_x2": 413.7, "r_y2": 114.05, "r_x3": 396.23, "r_y3": 114.05, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 97.38, "t": 141.28, "r": 105.08, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.38, "r_y0": 146.23, "r_x1": 105.08, "r_y1": 146.23, "r_x2": 105.08, "r_y2": 141.28, "r_x3": 97.38, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 60.94, "t": 85.73, "r": 76.15, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 60.94, "r_y0": 90.69, "r_x1": 76.15, "r_y1": 90.69, "r_x2": 76.15, "r_y2": 85.73, "r_x3": 60.94, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 82.3, "t": 86.22, "r": 106.99, "b": 91.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 82.3, "r_y0": 91.18, "r_x1": 106.99, "r_y1": 91.18, "r_x2": 106.99, "r_y2": 86.22, "r_x3": 82.3, "r_y3": 86.22, "coord_origin": "TOPLEFT" }, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 246.21, "t": 141.61, "r": 281.88, "b": 146.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.21, "r_y0": 146.56, "r_x1": 281.88, "r_y1": 146.56, "r_x2": 281.88, "r_y2": 141.61, "r_x3": 246.21, "r_y3": 141.61, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 226.7, "t": 85.73, "r": 241.91, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 226.7, "r_y0": 90.69, "r_x1": 241.91, "r_y1": 90.69, "r_x2": 241.91, "r_y2": 85.73, "r_x3": 226.7, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 249.94, "t": 86.09, "r": 282.49, "b": 91.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.94, "r_y0": 91.05, "r_x1": 282.49, "r_y1": 91.05, "r_x2": 282.49, "r_y2": 86.09, "r_x3": 249.94, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "91K 10K 10K", "orig": "91K 10K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 410.19, "t": 141.28, "r": 444.69, "b": 146.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.19, "r_y0": 146.23, "r_x1": 444.69, "r_y1": 146.23, "r_x2": 444.69, "r_y2": 141.28, "r_x3": 410.19, "r_y3": 141.28, "coord_origin": "TOPLEFT" }, "text": "Train Test Val", "orig": "Train Test Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 391.37, "t": 85.73, "r": 432.67, "b": 90.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.37, "r_y0": 90.69, "r_x1": 432.67, "r_y1": 90.69, "r_x2": 432.67, "r_y2": 85.73, "r_x3": 391.37, "r_y3": 85.73, "coord_origin": "TOPLEFT" }, "text": "100% 130K 5K", "orig": "100% 130K 5K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 435.61, "t": 86.26, "r": 445.62, "b": 91.22, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.61, "r_y0": 91.22, "r_x1": 445.62, "r_y1": 91.22, "r_x2": 445.62, "r_y2": 86.26, "r_x3": 435.61, "r_y3": 86.26, "coord_origin": "TOPLEFT" }, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 113.95, "t": 141.29, "r": 136.2, "b": 146.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.95, "r_y0": 146.25, "r_x1": 136.2, "r_y1": 146.25, "r_x2": 136.2, "r_y2": 141.29, "r_x3": 113.95, "r_y3": 141.29, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 116.92, "t": 94.82, "r": 127.05, "b": 99.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 116.92, "r_y0": 99.78, "r_x1": 127.05, "r_y1": 99.78, "r_x2": 127.05, "r_y2": 94.82, "r_x3": 116.92, "r_y3": 94.82, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 113.31, "t": 100.94, "r": 127.05, "b": 105.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.31, "r_y0": 105.9, "r_x1": 127.05, "r_y1": 105.9, "r_x2": 127.05, "r_y2": 100.94, "r_x3": 113.31, "r_y3": 100.94, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 112.94, "t": 107.06, "r": 127.06, "b": 112.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.94, "r_y0": 112.02, "r_x1": 127.06, "r_y1": 112.02, "r_x2": 127.06, "r_y2": 107.06, "r_x3": 112.94, "r_y3": 107.06, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 113.23, "t": 122.62, "r": 126.97, "b": 127.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 113.23, "r_y0": 127.57, "r_x1": 126.97, "r_y1": 127.57, "r_x2": 126.97, "r_y2": 122.62, "r_x3": 113.23, "r_y3": 122.62, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 112.85, "t": 128.74, "r": 126.97, "b": 133.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.85, "r_y0": 133.69, "r_x1": 126.97, "r_y1": 133.69, "r_x2": 126.97, "r_y2": 128.74, "r_x3": 112.85, "r_y3": 128.74, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 138.58, "t": 141.44, "r": 156.04, "b": 146.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.58, "r_y0": 146.39, "r_x1": 156.04, "r_y1": 146.39, "r_x2": 156.04, "r_y2": 141.44, "r_x3": 138.58, "r_y3": 141.44, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 122.03, "t": 86.27, "r": 151.04, "b": 91.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 122.03, "r_y0": 91.23, "r_x1": 151.04, "r_y1": 91.23, "r_x2": 151.04, "r_y2": 86.27, "r_x3": 122.03, "r_y3": 86.27, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 311.65, "t": 86.55, "r": 321.67, "b": 91.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.65, "r_y0": 91.51, "r_x1": 321.67, "r_y1": 91.51, "r_x2": 321.67, "r_y2": 86.55, "r_x3": 311.65, "r_y3": 86.55, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 287.89, "t": 141.71, "r": 310.15, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.89, "r_y0": 146.67, "r_x1": 310.15, "r_y1": 146.67, "r_x2": 310.15, "r_y2": 141.71, "r_x3": 287.89, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.24, "t": 93.08, "r": 299.37, "b": 98.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.24, "r_y0": 98.04, "r_x1": 299.37, "r_y1": 98.04, "r_x2": 299.37, "r_y2": 93.08, "r_x3": 289.24, "r_y3": 93.08, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 285.64, "t": 99.2, "r": 299.37, "b": 104.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 104.16, "r_x1": 299.37, "r_y1": 104.16, "r_x2": 299.37, "r_y2": 99.2, "r_x3": 285.64, "r_y3": 99.2, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 285.26, "t": 105.32, "r": 299.38, "b": 110.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.26, "r_y0": 110.28, "r_x1": 299.38, "r_y1": 110.28, "r_x2": 299.38, "r_y2": 105.32, "r_x3": 285.26, "r_y3": 105.32, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 285.43, "t": 120.39, "r": 299.17, "b": 125.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.43, "r_y0": 125.35, "r_x1": 299.17, "r_y1": 125.35, "r_x2": 299.17, "r_y2": 120.39, "r_x3": 285.43, "r_y3": 120.39, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 285.06, "t": 126.51, "r": 299.17, "b": 131.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.06, "r_y0": 131.47, "r_x1": 299.17, "r_y1": 131.47, "r_x2": 299.17, "r_y2": 126.51, "r_x3": 285.06, "r_y3": 126.51, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 311.35, "t": 141.71, "r": 328.81, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 311.35, "r_y0": 146.67, "r_x1": 328.81, "r_y1": 146.67, "r_x2": 328.81, "r_y2": 141.71, "r_x3": 311.35, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 299.58, "t": 86.69, "r": 309.6, "b": 91.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 299.58, "r_y0": 91.65, "r_x1": 309.6, "r_y1": 91.65, "r_x2": 309.6, "r_y2": 86.69, "r_x3": 299.58, "r_y3": 86.69, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 466.04, "t": 141.67, "r": 483.5, "b": 146.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 466.04, "r_y0": 146.63, "r_x1": 483.5, "r_y1": 146.63, "r_x2": 483.5, "r_y2": 141.67, "r_x3": 466.04, "r_y3": 141.67, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 459.02, "t": 93.76, "r": 469.16, "b": 98.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 459.02, "r_y0": 98.72, "r_x1": 469.16, "r_y1": 98.72, "r_x2": 469.16, "r_y2": 93.76, "r_x3": 459.02, "r_y3": 93.76, "coord_origin": "TOPLEFT" }, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 455.42, "t": 99.88, "r": 469.16, "b": 104.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.42, "r_y0": 104.84, "r_x1": 469.16, "r_y1": 104.84, "r_x2": 469.16, "r_y2": 99.88, "r_x3": 455.42, "r_y3": 99.88, "coord_origin": "TOPLEFT" }, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 455.05, "t": 106.0, "r": 469.16, "b": 110.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 455.05, "r_y0": 110.96, "r_x1": 469.16, "r_y1": 110.96, "r_x2": 469.16, "r_y2": 106.0, "r_x3": 455.05, "r_y3": 106.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 467.39, "t": 85.57, "r": 480.65, "b": 90.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 467.39, "r_y0": 90.53, "r_x1": 480.65, "r_y1": 90.53, "r_x2": 480.65, "r_y2": 85.57, "r_x3": 467.39, "r_y3": 85.57, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 160.38, "t": 141.58, "r": 182.63, "b": 146.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.38, "r_y0": 146.54, "r_x1": 182.63, "r_y1": 146.54, "r_x2": 182.63, "r_y2": 141.58, "r_x3": 160.38, "r_y3": 141.58, "coord_origin": "TOPLEFT" }, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 153.74, "t": 94.86, "r": 173.33, "b": 99.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.74, "r_y0": 99.82, "r_x1": 173.33, "r_y1": 99.82, "r_x2": 173.33, "r_y2": 94.86, "r_x3": 153.74, "r_y3": 94.86, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 154.51, "t": 100.98, "r": 173.32, "b": 105.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 105.94, "r_x1": 173.32, "r_y1": 105.94, "r_x2": 173.32, "r_y2": 100.98, "r_x3": 154.51, "r_y3": 100.98, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 155.27, "t": 107.1, "r": 173.33, "b": 112.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.27, "r_y0": 112.06, "r_x1": 173.33, "r_y1": 112.06, "r_x2": 173.33, "r_y2": 107.1, "r_x3": 155.27, "r_y3": 107.1, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 326.41, "t": 107.23, "r": 346.0, "b": 112.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.41, "r_y0": 112.19, "r_x1": 346.0, "r_y1": 112.19, "r_x2": 346.0, "r_y2": 107.23, "r_x3": 326.41, "r_y3": 107.23, "coord_origin": "TOPLEFT" }, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 327.18, "t": 113.35, "r": 345.99, "b": 118.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.18, "r_y0": 118.31, "r_x1": 345.99, "r_y1": 118.31, "r_x2": 345.99, "r_y2": 113.35, "r_x3": 327.18, "r_y3": 113.35, "coord_origin": "TOPLEFT" }, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 327.94, "t": 119.47, "r": 346.0, "b": 124.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.94, "r_y0": 124.43, "r_x1": 346.0, "r_y1": 124.43, "r_x2": 346.0, "r_y2": 119.47, "r_x3": 327.94, "r_y3": 119.47, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 488.99, "t": 104.15, "r": 508.76, "b": 109.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 488.99, "r_y0": 109.11, "r_x1": 508.76, "r_y1": 109.11, "r_x2": 508.76, "r_y2": 104.15, "r_x3": 488.99, "r_y3": 104.15, "coord_origin": "TOPLEFT" }, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 490.19, "t": 110.27, "r": 508.76, "b": 115.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.19, "r_y0": 115.23, "r_x1": 508.76, "r_y1": 115.23, "r_x2": 508.76, "r_y2": 110.27, "r_x3": 490.19, "r_y3": 110.27, "coord_origin": "TOPLEFT" }, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 489.72, "t": 116.39, "r": 508.77, "b": 121.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 489.72, "r_y0": 121.35, "r_x1": 508.77, "r_y1": 121.35, "r_x2": 508.77, "r_y2": 116.39, "r_x3": 489.72, "r_y3": 116.39, "coord_origin": "TOPLEFT" }, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 490.71, "t": 122.51, "r": 508.77, "b": 127.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 490.71, "r_y0": 127.47, "r_x1": 508.77, "r_y1": 127.47, "r_x2": 508.77, "r_y2": 122.51, "r_x3": 490.71, "r_y3": 122.51, "coord_origin": "TOPLEFT" }, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 185.38, "t": 141.71, "r": 202.84, "b": 146.67, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.38, "r_y0": 146.67, "r_x1": 202.84, "r_y1": 146.67, "r_x2": 202.84, "r_y2": 141.71, "r_x3": 185.38, "r_y3": 141.71, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 168.5, "t": 86.14, "r": 197.53, "b": 91.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.5, "r_y0": 91.09, "r_x1": 197.53, "r_y1": 91.09, "r_x2": 197.53, "r_y2": 86.14, "r_x3": 168.5, "r_y3": 86.14, "coord_origin": "TOPLEFT" }, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 357.38, "t": 86.0, "r": 367.4, "b": 90.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.38, "r_y0": 90.95, "r_x1": 367.4, "r_y1": 90.95, "r_x2": 367.4, "r_y2": 86.0, "r_x3": 357.38, "r_y3": 86.0, "coord_origin": "TOPLEFT" }, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 333.73, "t": 141.62, "r": 374.93, "b": 146.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.73, "r_y0": 146.58, "r_x1": 374.93, "r_y1": 146.58, "r_x2": 374.93, "r_y2": 141.62, "r_x3": 333.73, "r_y3": 141.62, "coord_origin": "TOPLEFT" }, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 345.69, "t": 86.06, "r": 355.71, "b": 91.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.69, "r_y0": 91.01, "r_x1": 355.71, "r_y1": 91.01, "r_x2": 355.71, "r_y2": 86.06, "r_x3": 345.69, "r_y3": 86.06, "coord_origin": "TOPLEFT" }, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 508.54, "t": 141.38, "r": 526.01, "b": 146.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 508.54, "r_y0": 146.33, "r_x1": 526.01, "r_y1": 146.33, "r_x2": 526.01, "r_y2": 141.38, "r_x3": 508.54, "r_y3": 141.38, "coord_origin": "TOPLEFT" }, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 510.45, "t": 86.09, "r": 523.71, "b": 91.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 510.45, "r_y0": 91.05, "r_x1": 523.71, "r_y1": 91.05, "r_x2": 523.71, "r_y2": 86.09, "r_x3": 510.45, "r_y3": 86.09, "coord_origin": "TOPLEFT" }, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "caption", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 50.11, "t": 165.5, "r": 545.11, "b": 186.36, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 174.41, "r_x1": 545.11, "r_y1": 174.41, "r_x2": 545.11, "r_y2": 165.5, "r_x3": 50.11, "r_y3": 165.5, "coord_origin": "TOPLEFT" }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 186.36, "r_x1": 513.52, "r_y1": 186.36, "r_x2": 513.52, "r_y2": 177.46, "r_x3": 50.11, "r_y3": 177.46, "coord_origin": "TOPLEFT" }, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity." }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 61.57, "t": 210.93, "r": 286.37, "b": 231.79, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 219.84, "r_x1": 71.15, "r_y1": 219.84, "r_x2": 71.15, "r_y2": 210.93, "r_x3": 61.57, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.54, "r_y0": 219.84, "r_x1": 286.37, "r_y1": 219.84, "r_x2": 286.37, "r_y2": 210.93, "r_x3": 73.54, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 231.79, "r_x1": 87.47, "r_y1": 231.79, "r_x2": 87.47, "r_y2": 222.89, "r_x3": 70.04, "r_y3": 222.89, "coord_origin": "TOPLEFT" }, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 TableFormer output does not include the table cell content." }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 61.57, "t": 244.07, "r": 286.37, "b": 264.93, "coord_origin": "TOPLEFT" }, "confidence": 0.963, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 61.57, "r_y0": 252.98, "r_x1": 71.35, "r_y1": 252.98, "r_x2": 71.35, "r_y2": 244.07, "r_x3": 61.57, "r_y3": 244.07, "coord_origin": "TOPLEFT" }, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 73.79, "r_y0": 252.98, "r_x1": 286.37, "r_y1": 252.98, "r_x2": 286.37, "r_y2": 244.07, "r_x3": 73.79, "r_y3": 244.07, "coord_origin": "TOPLEFT" }, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 70.04, "r_y0": 264.93, "r_x1": 150.42, "r_y1": 264.93, "r_x2": 150.42, "r_y2": 256.03, "r_x3": 70.04, "r_y3": 256.03, "coord_origin": "TOPLEFT" }, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 50.11, "t": 279.2, "r": 286.37, "b": 395.71, "coord_origin": "TOPLEFT" }, "confidence": 0.977, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 288.11, "r_x1": 286.36, "r_y1": 288.11, "r_x2": 286.36, "r_y2": 279.2, "r_x3": 62.07, "r_y3": 279.2, "coord_origin": "TOPLEFT" }, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 300.06, "r_x1": 286.37, "r_y1": 300.06, "r_x2": 286.37, "r_y2": 291.16, "r_x3": 50.11, "r_y3": 291.16, "coord_origin": "TOPLEFT" }, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 312.02, "r_x1": 286.37, "r_y1": 312.02, "r_x2": 286.37, "r_y2": 303.11, "r_x3": 50.11, "r_y3": 303.11, "coord_origin": "TOPLEFT" }, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 323.97, "r_x1": 286.37, "r_y1": 323.97, "r_x2": 286.37, "r_y2": 315.07, "r_x3": 50.11, "r_y3": 315.07, "coord_origin": "TOPLEFT" }, "text": "More specifically, PDF documents can be seen as a se-", "orig": "More specifically, PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 335.93, "r_x1": 286.37, "r_y1": 335.93, "r_x2": 286.37, "r_y2": 327.02, "r_x3": 50.11, "r_y3": 327.02, "coord_origin": "TOPLEFT" }, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 347.89, "r_x1": 286.37, "r_y1": 347.89, "r_x2": 286.37, "r_y2": 338.98, "r_x3": 50.11, "r_y3": 338.98, "coord_origin": "TOPLEFT" }, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 359.84, "r_x1": 286.37, "r_y1": 359.84, "r_x2": 286.37, "r_y2": 350.93, "r_x3": 50.11, "r_y3": 350.93, "coord_origin": "TOPLEFT" }, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 371.8, "r_x1": 286.37, "r_y1": 371.8, "r_x2": 286.37, "r_y2": 362.89, "r_x3": 50.11, "r_y3": 362.89, "coord_origin": "TOPLEFT" }, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 383.75, "r_x1": 286.37, "r_y1": 383.75, "r_x2": 286.37, "r_y2": 374.84, "r_x3": 50.11, "r_y3": 374.84, "coord_origin": "TOPLEFT" }, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 395.71, "r_x1": 154.56, "r_y1": 395.71, "r_x2": 154.56, "r_y2": 386.8, "r_x3": 50.11, "r_y3": 386.8, "coord_origin": "TOPLEFT" }, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes." }, { "label": "text", "id": 11, "page_no": 11, "cluster": { "id": 11, "label": "text", "bbox": { "l": 50.11, "t": 399.07, "r": 286.36, "b": 419.93, "coord_origin": "TOPLEFT" }, "confidence": 0.935, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 407.98, "r_x1": 286.36, "r_y1": 407.98, "r_x2": 286.36, "r_y2": 399.07, "r_x3": 62.07, "r_y3": 399.07, "coord_origin": "TOPLEFT" }, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 419.93, "r_x1": 95.49, "r_y1": 419.93, "r_x2": 95.49, "r_y2": 411.03, "r_x3": 50.11, "r_y3": 411.03, "coord_origin": "TOPLEFT" }, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Here is a step-by-step description of the prediction postprocessing:" }, { "label": "list_item", "id": 20, "page_no": 11, "cluster": { "id": 20, "label": "list_item", "bbox": { "l": 50.11, "t": 423.3, "r": 286.37, "b": 456.11, "coord_origin": "TOPLEFT" }, "confidence": 0.828, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 432.2, "r_x1": 69.37, "r_y1": 432.2, "r_x2": 69.37, "r_y2": 423.3, "r_x3": 62.07, "r_y3": 423.3, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 71.81, "r_y0": 432.2, "r_x1": 286.37, "r_y1": 432.2, "r_x2": 286.37, "r_y2": 423.3, "r_x3": 71.81, "r_y3": 423.3, "coord_origin": "TOPLEFT" }, "text": "Get the minimal grid dimensions - number of rows and", "orig": "Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 444.16, "r_x1": 286.37, "r_y1": 444.16, "r_x2": 286.37, "r_y2": 435.25, "r_x3": 50.11, "r_y3": 435.25, "coord_origin": "TOPLEFT" }, "text": "columns for the predicted table structure. This represents", "orig": "columns for the predicted table structure. This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 456.11, "r_x1": 274.51, "r_y1": 456.11, "r_x2": 274.51, "r_y2": 447.21, "r_x3": 50.11, "r_y3": 447.21, "coord_origin": "TOPLEFT" }, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure." }, { "label": "list_item", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 50.11, "t": 459.48, "r": 286.37, "b": 504.25, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 468.38, "r_x1": 69.54, "r_y1": 468.38, "r_x2": 69.54, "r_y2": 459.48, "r_x3": 62.07, "r_y3": 459.48, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 77.43, "r_y0": 468.38, "r_x1": 286.36, "r_y1": 468.38, "r_x2": 286.36, "r_y2": 459.48, "r_x3": 77.43, "r_y3": 459.48, "coord_origin": "TOPLEFT" }, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 480.34, "r_x1": 286.37, "r_y1": 480.34, "r_x2": 286.37, "r_y2": 471.43, "r_x3": 50.11, "r_y3": 471.43, "coord_origin": "TOPLEFT" }, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 492.29, "r_x1": 286.37, "r_y1": 492.29, "r_x2": 286.37, "r_y2": 483.39, "r_x3": 50.11, "r_y3": 483.39, "coord_origin": "TOPLEFT" }, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 504.25, "r_x1": 110.7, "r_y1": 504.25, "r_x2": 110.7, "r_y2": 495.34, "r_x3": 50.11, "r_y3": 495.34, "coord_origin": "TOPLEFT" }, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches." }, { "label": "list_item", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 50.11, "t": 507.61, "r": 286.36, "b": 528.47, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 516.52, "r_x1": 69.86, "r_y1": 516.52, "r_x2": 69.86, "r_y2": 507.61, "r_x3": 62.07, "r_y3": 507.61, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 72.46, "r_y0": 516.52, "r_x1": 286.36, "r_y1": 516.52, "r_x2": 286.36, "r_y2": 507.61, "r_x3": 72.46, "r_y3": 507.61, "coord_origin": "TOPLEFT" }, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 528.47, "r_x1": 226.07, "r_y1": 528.47, "r_x2": 226.07, "r_y2": 519.57, "r_x3": 50.11, "r_y3": 519.57, "coord_origin": "TOPLEFT" }, "text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Use a carefully selected IOU threshold to designate the matches as \"good\" ones and \"bad\" ones." }, { "label": "list_item", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 50.11, "t": 531.84, "r": 286.37, "b": 564.65, "coord_origin": "TOPLEFT" }, "confidence": 0.949, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 540.74, "r_x1": 286.36, "r_y1": 540.74, "r_x2": 286.36, "r_y2": 531.84, "r_x3": 62.07, "r_y3": 531.84, "coord_origin": "TOPLEFT" }, "text": "3.a. If all IOU scores in a column are below the thresh-", "orig": "3.a. If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 552.7, "r_x1": 286.37, "r_y1": 552.7, "r_x2": 286.37, "r_y2": 543.79, "r_x3": 50.11, "r_y3": 543.79, "coord_origin": "TOPLEFT" }, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 564.65, "r_x1": 114.03, "r_y1": 564.65, "r_x2": 114.03, "r_y2": 555.75, "r_x3": 50.11, "r_y3": 555.75, "coord_origin": "TOPLEFT" }, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column." }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 50.11, "t": 568.02, "r": 286.37, "b": 600.83, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 576.92, "r_x1": 69.54, "r_y1": 576.92, "r_x2": 69.54, "r_y2": 568.02, "r_x3": 62.07, "r_y3": 568.02, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.73, "r_y0": 576.92, "r_x1": 286.37, "r_y1": 576.92, "r_x2": 286.37, "r_y2": 568.02, "r_x3": 76.73, "r_y3": 568.02, "coord_origin": "TOPLEFT" }, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 588.88, "r_x1": 286.37, "r_y1": 588.88, "r_x2": 286.37, "r_y2": 579.97, "r_x3": 50.11, "r_y3": 579.97, "coord_origin": "TOPLEFT" }, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 600.83, "r_x1": 278.7, "r_y1": 600.83, "r_x2": 278.7, "r_y2": 591.93, "r_x3": 50.11, "r_y3": 591.93, "coord_origin": "TOPLEFT" }, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:" }, { "label": "formula", "id": 12, "page_no": 11, "cluster": { "id": 12, "label": "formula", "bbox": { "l": 110.7, "t": 623.44, "r": 286.36, "b": 654.11, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 112.03, "r_y0": 632.84, "r_x1": 157.95, "r_y1": 632.84, "r_x2": 157.95, "r_y2": 623.99, "r_x3": 112.03, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.72, "r_y0": 632.84, "r_x1": 203.5, "r_y1": 632.84, "r_x2": 203.5, "r_y2": 623.99, "r_x3": 160.72, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.58, "r_y0": 640.18, "r_x1": 189.15, "r_y1": 640.18, "r_x2": 189.15, "r_y2": 633.98, "r_x3": 185.58, "r_y3": 633.98, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 203.5, "r_y0": 632.84, "r_x1": 208.48, "r_y1": 632.84, "r_x2": 208.48, "r_y2": 623.44, "r_x3": 203.5, "r_y3": 623.44, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.48, "r_y0": 632.84, "r_x1": 220.29, "r_y1": 632.84, "r_x2": 220.29, "r_y2": 623.99, "r_x3": 208.48, "r_y3": 623.99, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.79, "r_y0": 632.84, "r_x1": 225.77, "r_y1": 632.84, "r_x2": 225.77, "r_y2": 623.44, "r_x3": 220.79, "r_y3": 623.44, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 110.7, "r_y0": 654.11, "r_x1": 122.51, "r_y1": 654.11, "r_x2": 122.51, "r_y2": 645.26, "r_x3": 110.7, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "D$_{c}$", "orig": "D$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 125.78, "r_y0": 654.11, "r_x1": 133.53, "r_y1": 654.11, "r_x2": 133.53, "r_y2": 645.26, "r_x3": 125.78, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 136.29, "r_y0": 654.11, "r_x1": 156.0, "r_y1": 654.11, "r_x2": 156.0, "r_y2": 645.26, "r_x3": 136.29, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "max", "orig": "max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 156.0, "r_y0": 654.11, "r_x1": 160.98, "r_y1": 654.11, "r_x2": 160.98, "r_y2": 644.7, "r_x3": 156.0, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.98, "r_y0": 654.11, "r_x1": 170.24, "r_y1": 654.11, "r_x2": 170.24, "r_y2": 645.26, "r_x3": 160.98, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 170.74, "r_y0": 654.11, "r_x1": 185.68, "r_y1": 654.11, "r_x2": 185.68, "r_y2": 644.7, "r_x3": 170.74, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "} \u2212", "orig": "} \u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.89, "r_y0": 654.11, "r_x1": 206.05, "r_y1": 654.11, "r_x2": 206.05, "r_y2": 645.26, "r_x3": 187.89, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "min", "orig": "min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.05, "r_y0": 654.11, "r_x1": 211.04, "r_y1": 654.11, "r_x2": 211.04, "r_y2": 644.7, "r_x3": 206.05, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.03, "r_y0": 654.11, "r_x1": 220.29, "r_y1": 654.11, "r_x2": 220.29, "r_y2": 645.26, "r_x3": 211.03, "r_y3": 645.26, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.79, "r_y0": 654.11, "r_x1": 225.77, "r_y1": 654.11, "r_x2": 225.77, "r_y2": 644.7, "r_x3": 220.79, "r_y3": 644.7, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.75, "r_y0": 643.79, "r_x1": 286.36, "r_y1": 643.79, "r_x2": 286.36, "r_y2": 634.89, "r_x3": 274.75, "r_y3": 634.89, "coord_origin": "TOPLEFT" }, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "alignment = arg min c { D$_{c}$ } D$_{c}$ = max { x$_{c}$ } \u2212 min { x$_{c}$ } (4)" }, { "label": "text", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "text", "bbox": { "l": 50.11, "t": 667.35, "r": 286.36, "b": 688.93, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 676.97, "r_x1": 74.45, "r_y1": 676.97, "r_x2": 74.45, "r_y2": 668.07, "r_x3": 50.11, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 78.34, "r_y0": 676.75, "r_x1": 82.65, "r_y1": 676.75, "r_x2": 82.65, "r_y2": 667.91, "r_x3": 78.34, "r_y3": 667.91, "coord_origin": "TOPLEFT" }, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 86.53, "r_y0": 676.97, "r_x1": 123.63, "r_y1": 676.97, "r_x2": 123.63, "r_y2": 668.07, "r_x3": 86.53, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "is one of", "orig": "is one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 127.52, "r_y0": 676.75, "r_x1": 132.5, "r_y1": 676.75, "r_x2": 132.5, "r_y2": 667.35, "r_x3": 127.52, "r_y3": 667.35, "coord_origin": "TOPLEFT" }, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 132.5, "r_y0": 676.97, "r_x1": 210.7, "r_y1": 676.97, "r_x2": 210.7, "r_y2": 668.07, "r_x3": 132.5, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "left, centroid, right", "orig": "left, centroid, right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.7, "r_y0": 676.75, "r_x1": 215.68, "r_y1": 676.75, "r_x2": 215.68, "r_y2": 667.35, "r_x3": 210.7, "r_y3": 667.35, "coord_origin": "TOPLEFT" }, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 219.56, "r_y0": 676.97, "r_x1": 233.95, "r_y1": 676.97, "r_x2": 233.95, "r_y2": 668.07, "r_x3": 219.56, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 237.83, "r_y0": 676.75, "r_x1": 247.09, "r_y1": 676.75, "r_x2": 247.09, "r_y2": 667.91, "r_x3": 237.83, "r_y3": 667.91, "coord_origin": "TOPLEFT" }, "text": "x$_{c}$", "orig": "x$_{c}$", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.47, "r_y0": 676.97, "r_x1": 286.36, "r_y1": 676.97, "r_x2": 286.36, "r_y2": 668.07, "r_x3": 251.47, "r_y3": 668.07, "coord_origin": "TOPLEFT" }, "text": "is the x-", "orig": "is the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 688.93, "r_x1": 205.89, "r_y1": 688.93, "r_x2": 205.89, "r_y2": 680.02, "r_x3": 50.11, "r_y3": 680.02, "coord_origin": "TOPLEFT" }, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "where c is one of { left, centroid, right } and x$_{c}$ is the xcoordinate for the corresponding point." }, { "label": "list_item", "id": 13, "page_no": 11, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 50.11, "t": 692.29, "r": 286.36, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 701.2, "r_x1": 69.54, "r_y1": 701.2, "r_x2": 69.54, "r_y2": 692.29, "r_x3": 62.07, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 76.27, "r_y0": 701.2, "r_x1": 286.36, "r_y1": 701.2, "r_x2": 286.36, "r_y2": 692.29, "r_x3": 76.27, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 713.15, "r_x1": 94.6, "r_y1": 713.15, "r_x2": 94.6, "r_y2": 704.25, "r_x3": 50.11, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 97.6, "r_y0": 712.93, "r_x1": 103.29, "r_y1": 712.93, "r_x2": 103.29, "r_y2": 704.09, "r_x3": 97.6, "r_y3": 704.09, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.29, "r_y0": 713.15, "r_x1": 286.36, "r_y1": 713.15, "r_x2": 286.36, "r_y2": 704.25, "r_x3": 103.29, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Use the alignment computed in step 4, to compute the median x -coordinate for all table columns and the me-" }, { "label": "text", "id": 16, "page_no": 11, "cluster": { "id": 16, "label": "text", "bbox": { "l": 308.86, "t": 210.93, "r": 545.12, "b": 255.7, "coord_origin": "TOPLEFT" }, "confidence": 0.894, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 219.84, "r_x1": 545.12, "r_y1": 219.84, "r_x2": 545.12, "r_y2": 210.93, "r_x3": 308.86, "r_y3": 210.93, "coord_origin": "TOPLEFT" }, "text": "dian cell size for all table cells. The usage of median dur-", "orig": "dian cell size for all table cells. The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 231.79, "r_x1": 545.12, "r_y1": 231.79, "r_x2": 545.12, "r_y2": 222.89, "r_x3": 308.86, "r_y3": 222.89, "coord_origin": "TOPLEFT" }, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 243.75, "r_x1": 545.12, "r_y1": 243.75, "r_x2": 545.12, "r_y2": 234.84, "r_x3": 308.86, "r_y3": 234.84, "coord_origin": "TOPLEFT" }, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 255.7, "r_x1": 339.58, "r_y1": 255.7, "r_x2": 339.58, "r_y2": 246.8, "r_x3": 308.86, "r_y3": 246.8, "coord_origin": "TOPLEFT" }, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal." }, { "label": "list_item", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 308.86, "t": 259.1, "r": 545.11, "b": 279.96, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 268.01, "r_x1": 328.29, "r_y1": 268.01, "r_x2": 328.29, "r_y2": 259.1, "r_x3": 320.82, "r_y3": 259.1, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.88, "r_y0": 268.01, "r_x1": 545.11, "r_y1": 268.01, "r_x2": 545.11, "r_y2": 259.1, "r_x3": 334.88, "r_y3": 259.1, "coord_origin": "TOPLEFT" }, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 279.96, "r_x1": 338.19, "r_y1": 279.96, "r_x2": 338.19, "r_y2": 271.06, "r_x3": 308.86, "r_y3": 271.06, "coord_origin": "TOPLEFT" }, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.68, "r_y0": 279.74, "r_x1": 346.38, "r_y1": 279.74, "r_x2": 346.38, "r_y2": 270.9, "r_x3": 340.68, "r_y3": 270.9, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.38, "r_y0": 279.96, "r_x1": 453.72, "r_y1": 279.96, "r_x2": 453.72, "r_y2": 271.06, "r_x3": 346.38, "r_y3": 271.06, "coord_origin": "TOPLEFT" }, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes." }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 308.86, "t": 283.36, "r": 545.12, "b": 387.91, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 292.27, "r_x1": 328.39, "r_y1": 292.27, "r_x2": 328.39, "r_y2": 283.36, "r_x3": 320.82, "r_y3": 283.36, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.91, "r_y0": 292.27, "r_x1": 545.11, "r_y1": 292.27, "r_x2": 545.11, "r_y2": 283.36, "r_x3": 330.91, "r_y3": 283.36, "coord_origin": "TOPLEFT" }, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 304.22, "r_x1": 545.12, "r_y1": 304.22, "r_x2": 545.12, "r_y2": 295.32, "r_x3": 308.86, "r_y3": 295.32, "coord_origin": "TOPLEFT" }, "text": "corrected bounding boxes and PDF cells. This time use a", "orig": "corrected bounding boxes and PDF cells. This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 316.18, "r_x1": 545.12, "r_y1": 316.18, "r_x2": 545.12, "r_y2": 307.27, "r_x3": 308.86, "r_y3": 307.27, "coord_origin": "TOPLEFT" }, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 328.13, "r_x1": 545.12, "r_y1": 328.13, "r_x2": 545.12, "r_y2": 319.23, "r_x3": 308.86, "r_y3": 319.23, "coord_origin": "TOPLEFT" }, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 340.09, "r_x1": 397.19, "r_y1": 340.09, "r_x2": 397.19, "r_y2": 331.18, "r_x3": 308.86, "r_y3": 331.18, "coord_origin": "TOPLEFT" }, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 403.66, "r_y0": 340.09, "r_x1": 545.12, "r_y1": 340.09, "r_x2": 545.12, "r_y2": 331.18, "r_x3": 403.66, "r_y3": 331.18, "coord_origin": "TOPLEFT" }, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 352.05, "r_x1": 545.12, "r_y1": 352.05, "r_x2": 545.12, "r_y2": 343.14, "r_x3": 308.86, "r_y3": 343.14, "coord_origin": "TOPLEFT" }, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 364.0, "r_x1": 545.12, "r_y1": 364.0, "r_x2": 545.12, "r_y2": 355.09, "r_x3": 308.86, "r_y3": 355.09, "coord_origin": "TOPLEFT" }, "text": "is preferred. This covers the cases where the PDF cells are", "orig": "is preferred. This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 375.96, "r_x1": 545.12, "r_y1": 375.96, "r_x2": 545.12, "r_y2": 367.05, "r_x3": 308.86, "r_y3": 367.05, "coord_origin": "TOPLEFT" }, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 387.91, "r_x1": 329.61, "r_y1": 387.91, "r_x2": 329.61, "r_y2": 379.0, "r_x3": 308.86, "r_y3": 379.0, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells." }, { "label": "list_item", "id": 17, "page_no": 11, "cluster": { "id": 17, "label": "list_item", "bbox": { "l": 308.86, "t": 391.31, "r": 545.12, "b": 459.99, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 400.22, "r_x1": 328.55, "r_y1": 400.22, "r_x2": 328.55, "r_y2": 391.31, "r_x3": 320.82, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.13, "r_y0": 400.22, "r_x1": 545.12, "r_y1": 400.22, "r_x2": 545.12, "r_y2": 391.31, "r_x3": 331.13, "r_y3": 391.31, "coord_origin": "TOPLEFT" }, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 412.17, "r_x1": 545.12, "r_y1": 412.17, "r_x2": 545.12, "r_y2": 403.27, "r_x3": 308.86, "r_y3": 403.27, "coord_origin": "TOPLEFT" }, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 424.13, "r_x1": 545.12, "r_y1": 424.13, "r_x2": 545.12, "r_y2": 415.22, "r_x3": 308.86, "r_y3": 415.22, "coord_origin": "TOPLEFT" }, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 436.08, "r_x1": 545.12, "r_y1": 436.08, "r_x2": 545.12, "r_y2": 427.18, "r_x3": 308.86, "r_y3": 427.18, "coord_origin": "TOPLEFT" }, "text": "columns pointing to the same PDF column. In such case", "orig": "columns pointing to the same PDF column. In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 448.04, "r_x1": 545.12, "r_y1": 448.04, "r_x2": 545.12, "r_y2": 439.13, "r_x3": 308.86, "r_y3": 439.13, "coord_origin": "TOPLEFT" }, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 459.99, "r_x1": 426.18, "r_y1": 459.99, "r_x2": 426.18, "r_y2": 451.09, "r_x3": 308.86, "r_y3": 451.09, "coord_origin": "TOPLEFT" }, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score." }, { "label": "list_item", "id": 15, "page_no": 11, "cluster": { "id": 15, "label": "list_item", "bbox": { "l": 308.86, "t": 463.39, "r": 545.12, "b": 567.94, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 472.3, "r_x1": 328.67, "r_y1": 472.3, "r_x2": 328.67, "r_y2": 463.39, "r_x3": 320.82, "r_y3": 463.39, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.29, "r_y0": 472.3, "r_x1": 545.11, "r_y1": 472.3, "r_x2": 545.11, "r_y2": 463.39, "r_x3": 331.29, "r_y3": 463.39, "coord_origin": "TOPLEFT" }, "text": "Pick up the remaining orphan cells. There could be", "orig": "Pick up the remaining orphan cells. There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 484.25, "r_x1": 545.12, "r_y1": 484.25, "r_x2": 545.12, "r_y2": 475.35, "r_x3": 308.86, "r_y3": 475.35, "coord_origin": "TOPLEFT" }, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 496.21, "r_x1": 545.12, "r_y1": 496.21, "r_x2": 545.12, "r_y2": 487.3, "r_x3": 308.86, "r_y3": 487.3, "coord_origin": "TOPLEFT" }, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 508.16, "r_x1": 381.9, "r_y1": 508.16, "r_x2": 381.9, "r_y2": 499.26, "r_x3": 308.86, "r_y3": 499.26, "coord_origin": "TOPLEFT" }, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 388.7, "r_y0": 508.16, "r_x1": 545.12, "r_y1": 508.16, "r_x2": 545.12, "r_y2": 499.26, "r_x3": 388.7, "r_y3": 499.26, "coord_origin": "TOPLEFT" }, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 520.12, "r_x1": 545.12, "r_y1": 520.12, "r_x2": 545.12, "r_y2": 511.21, "r_x3": 308.86, "r_y3": 511.21, "coord_origin": "TOPLEFT" }, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 532.07, "r_x1": 545.12, "r_y1": 532.07, "r_x2": 545.12, "r_y2": 523.17, "r_x3": 308.86, "r_y3": 523.17, "coord_origin": "TOPLEFT" }, "text": "bounding box on the geometry of the grid. This mapping", "orig": "bounding box on the geometry of the grid. This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 544.03, "r_x1": 545.11, "r_y1": 544.03, "r_x2": 545.11, "r_y2": 535.12, "r_x3": 308.86, "r_y3": 535.12, "coord_origin": "TOPLEFT" }, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 555.98, "r_x1": 545.12, "r_y1": 555.98, "r_x2": 545.12, "r_y2": 547.08, "r_x3": 308.86, "r_y3": 547.08, "coord_origin": "TOPLEFT" }, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 167, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 567.94, "r_x1": 442.22, "r_y1": 567.94, "r_x2": 442.22, "r_y2": 559.03, "r_x3": 308.86, "r_y3": 559.03, "coord_origin": "TOPLEFT" }, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan." }, { "label": "text", "id": 19, "page_no": 11, "cluster": { "id": 19, "label": "text", "bbox": { "l": 308.86, "t": 571.34, "r": 545.12, "b": 604.15, "coord_origin": "TOPLEFT" }, "confidence": 0.846, "cells": [ { "index": 168, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 580.24, "r_x1": 545.11, "r_y1": 580.24, "r_x2": 545.11, "r_y2": 571.34, "r_x3": 320.82, "r_y3": 571.34, "coord_origin": "TOPLEFT" }, "text": "9a. Compute the top and bottom boundary of the hori-", "orig": "9a. Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 169, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 592.2, "r_x1": 471.64, "r_y1": 592.2, "r_x2": 471.64, "r_y2": 583.29, "r_x3": 308.86, "r_y3": 583.29, "coord_origin": "TOPLEFT" }, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 170, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 474.83, "r_y0": 591.98, "r_x1": 479.72, "r_y1": 591.98, "r_x2": 479.72, "r_y2": 583.13, "r_x3": 474.83, "r_y3": 583.13, "coord_origin": "TOPLEFT" }, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 171, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 483.27, "r_y0": 592.2, "r_x1": 545.12, "r_y1": 592.2, "r_x2": 545.12, "r_y2": 583.29, "r_x3": 483.27, "r_y3": 583.29, "coord_origin": "TOPLEFT" }, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 172, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 604.15, "r_x1": 329.91, "r_y1": 604.15, "r_x2": 329.91, "r_y2": 595.25, "r_x3": 308.86, "r_y3": 595.25, "coord_origin": "TOPLEFT" }, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)." }, { "label": "list_item", "id": 21, "page_no": 11, "cluster": { "id": 21, "label": "list_item", "bbox": { "l": 308.86, "t": 607.55, "r": 545.12, "b": 628.42, "coord_origin": "TOPLEFT" }, "confidence": 0.772, "cells": [ { "index": 173, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 616.46, "r_x1": 332.87, "r_y1": 616.46, "r_x2": 332.87, "r_y2": 607.55, "r_x3": 320.82, "r_y3": 607.55, "coord_origin": "TOPLEFT" }, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 174, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.93, "r_y0": 616.46, "r_x1": 545.12, "r_y1": 616.46, "r_x2": 545.12, "r_y2": 607.55, "r_x3": 339.93, "r_y3": 607.55, "coord_origin": "TOPLEFT" }, "text": "Intersect the orphan\u2019s bounding box with the row", "orig": "Intersect the orphan\u2019s bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 175, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 628.42, "r_x1": 495.29, "r_y1": 628.42, "r_x2": 495.29, "r_y2": 619.51, "r_x3": 308.86, "r_y3": 619.51, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row." }, { "label": "list_item", "id": 18, "page_no": 11, "cluster": { "id": 18, "label": "list_item", "bbox": { "l": 308.86, "t": 631.81, "r": 545.12, "b": 664.63, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 176, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 640.72, "r_x1": 545.12, "r_y1": 640.72, "r_x2": 545.12, "r_y2": 631.81, "r_x3": 320.82, "r_y3": 631.81, "coord_origin": "TOPLEFT" }, "text": "9c. Compute the left and right boundary of the vertical", "orig": "9c. Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 177, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 652.68, "r_x1": 455.28, "r_y1": 652.68, "r_x2": 455.28, "r_y2": 643.77, "r_x3": 308.86, "r_y3": 643.77, "coord_origin": "TOPLEFT" }, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 178, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 457.78, "r_y0": 652.46, "r_x1": 463.47, "r_y1": 652.46, "r_x2": 463.47, "r_y2": 643.61, "r_x3": 457.78, "r_y3": 643.61, "coord_origin": "TOPLEFT" }, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 179, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 465.97, "r_y0": 652.68, "r_x1": 545.11, "r_y1": 652.68, "r_x2": 545.11, "r_y2": 643.77, "r_x3": 465.97, "r_y3": 643.77, "coord_origin": "TOPLEFT" }, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 180, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 664.63, "r_x1": 332.38, "r_y1": 664.63, "r_x2": 332.38, "r_y2": 655.72, "r_x3": 308.86, "r_y3": 655.72, "coord_origin": "TOPLEFT" }, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)." }, { "label": "list_item", "id": 22, "page_no": 11, "cluster": { "id": 22, "label": "list_item", "bbox": { "l": 308.86, "t": 668.03, "r": 545.11, "b": 688.89, "coord_origin": "TOPLEFT" }, "confidence": 0.759, "cells": [ { "index": 181, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 676.94, "r_x1": 545.11, "r_y1": 676.94, "r_x2": 545.11, "r_y2": 668.03, "r_x3": 320.82, "r_y3": 668.03, "coord_origin": "TOPLEFT" }, "text": "9d. Intersect the orphan\u2019s bounding box with the column", "orig": "9d. Intersect the orphan\u2019s bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 182, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 688.89, "r_x1": 510.58, "r_y1": 688.89, "r_x2": 510.58, "r_y2": 679.99, "r_x3": 308.86, "r_y3": 679.99, "coord_origin": "TOPLEFT" }, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column." }, { "label": "list_item", "id": 25, "page_no": 11, "cluster": { "id": 25, "label": "list_item", "bbox": { "l": 308.86, "t": 692.29, "r": 545.12, "b": 713.15, "coord_origin": "TOPLEFT" }, "confidence": 0.697, "cells": [ { "index": 183, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.82, "r_y0": 701.2, "r_x1": 545.12, "r_y1": 701.2, "r_x2": 545.12, "r_y2": 692.29, "r_x3": 320.82, "r_y3": 692.29, "coord_origin": "TOPLEFT" }, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 184, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 713.15, "r_x1": 545.12, "r_y1": 713.15, "r_x2": 545.12, "r_y2": 704.25, "r_x3": 308.86, "r_y3": 704.25, "coord_origin": "TOPLEFT" }, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-" } ], "headers": [ { "label": "page_footer", "id": 14, "page_no": 11, "cluster": { "id": 14, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 185, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" } ] } }, { "page_no": 12, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 88.85, "r_y1": 84.11, "r_x2": 88.85, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 96.07, "r_x1": 286.36, "r_y1": 96.07, "r_x2": 286.36, "r_y2": 87.16, "r_x3": 62.07, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "9f. Otherwise create a new structural cell and match it", "orig": "9f. Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.02, "r_x1": 127.03, "r_y1": 108.02, "r_x2": 127.03, "r_y2": 99.12, "r_x3": 50.11, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 119.75, "r_x1": 286.36, "r_y1": 119.75, "r_x2": 286.36, "r_y2": 111.16, "r_x3": 62.07, "r_y3": 111.16, "coord_origin": "TOPLEFT" }, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.71, "r_x1": 234.06, "r_y1": 131.71, "r_x2": 234.06, "r_y2": 123.12, "r_x3": 50.11, "r_y3": 123.12, "coord_origin": "TOPLEFT" }, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.34, "r_y0": 510.96, "r_x1": 273.13, "r_y1": 510.96, "r_x2": 273.13, "r_y2": 502.06, "r_x3": 63.34, "r_y3": 502.06, "coord_origin": "TOPLEFT" }, "text": "Figure 8: Example of a table with multi-line header.", "orig": "Figure 8: Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 315.5, "r_x1": 345.63, "r_y1": 315.5, "r_x2": 345.63, "r_y2": 306.6, "r_x3": 308.86, "r_y3": 306.6, "coord_origin": "TOPLEFT" }, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.79, "r_y0": 315.5, "r_x1": 545.12, "r_y1": 315.5, "r_x2": 545.12, "r_y2": 306.6, "r_x3": 352.79, "r_y3": 306.6, "coord_origin": "TOPLEFT" }, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 327.46, "r_x1": 355.9, "r_y1": 327.46, "r_x2": 355.9, "r_y2": 318.55, "r_x3": 308.86, "r_y3": 318.55, "coord_origin": "TOPLEFT" }, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.34, "r_y0": 689.4, "r_x1": 541.63, "r_y1": 689.4, "r_x2": 541.63, "r_y2": 680.49, "r_x3": 312.34, "r_y3": 680.49, "coord_origin": "TOPLEFT" }, "text": "Figure 10: Example of a complex table with empty cells.", "orig": "Figure 10: Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 14, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 88.85, "b": 84.11, "coord_origin": "TOPLEFT" }, "confidence": 0.755, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 88.85, "r_y1": 84.11, "r_x2": 88.85, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 87.16, "r": 286.36, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.917, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 96.07, "r_x1": 286.36, "r_y1": 96.07, "r_x2": 286.36, "r_y2": 87.16, "r_x3": 62.07, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "9f. Otherwise create a new structural cell and match it", "orig": "9f. Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.02, "r_x1": 127.03, "r_y1": 108.02, "r_x2": 127.03, "r_y2": 99.12, "r_x3": 50.11, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 111.16, "r": 286.36, "b": 131.71, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 119.75, "r_x1": 286.36, "r_y1": 119.75, "r_x2": 286.36, "r_y2": 111.16, "r_x3": 62.07, "r_y3": 111.16, "coord_origin": "TOPLEFT" }, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.71, "r_x1": 234.06, "r_y1": 131.71, "r_x2": 234.06, "r_y2": 123.12, "r_x3": 50.11, "r_y3": 123.12, "coord_origin": "TOPLEFT" }, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "caption", "bbox": { "l": 63.34, "t": 502.06, "r": 273.13, "b": 510.96, "coord_origin": "TOPLEFT" }, "confidence": 0.897, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.34, "r_y0": 510.96, "r_x1": 273.13, "r_y1": 510.96, "r_x2": 273.13, "r_y2": 502.06, "r_x3": 63.34, "r_y3": 502.06, "coord_origin": "TOPLEFT" }, "text": "Figure 8: Example of a table with multi-line header.", "orig": "Figure 8: Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "caption", "bbox": { "l": 308.86, "t": 306.6, "r": 545.12, "b": 327.46, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 315.5, "r_x1": 345.63, "r_y1": 315.5, "r_x2": 345.63, "r_y2": 306.6, "r_x3": 308.86, "r_y3": 306.6, "coord_origin": "TOPLEFT" }, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.79, "r_y0": 315.5, "r_x1": 545.12, "r_y1": 315.5, "r_x2": 545.12, "r_y2": 306.6, "r_x3": 352.79, "r_y3": 306.6, "coord_origin": "TOPLEFT" }, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 327.46, "r_x1": 355.9, "r_y1": 327.46, "r_x2": 355.9, "r_y2": 318.55, "r_x3": 308.86, "r_y3": 318.55, "coord_origin": "TOPLEFT" }, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "caption", "bbox": { "l": 312.34, "t": 680.49, "r": 541.63, "b": 689.4, "coord_origin": "TOPLEFT" }, "confidence": 0.919, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.34, "r_y0": 689.4, "r_x1": 541.63, "r_y1": 689.4, "r_x2": 541.63, "r_y2": 680.49, "r_x3": 312.34, "r_y3": 680.49, "coord_origin": "TOPLEFT" }, "text": "Figure 10: Example of a complex table with empty cells.", "orig": "Figure 10: Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.902, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "table", "bbox": { "l": 310.33, "t": 101.18, "r": 555.83, "b": 136.15, "coord_origin": "TOPLEFT" }, "confidence": 0.705, "cells": [], "children": [] }, { "id": 32, "label": "table", "bbox": { "l": 309.96, "t": 154.61, "r": 555.75, "b": 184.72, "coord_origin": "TOPLEFT" }, "confidence": 0.564, "cells": [], "children": [] }, { "id": 9, "label": "table", "bbox": { "l": 84.03, "t": 156.33, "r": 239.17, "b": 214.39, "coord_origin": "TOPLEFT" }, "confidence": 0.886, "cells": [], "children": [] }, { "id": 21, "label": "table", "bbox": { "l": 309.96, "t": 195.71, "r": 555.71, "b": 233.55, "coord_origin": "TOPLEFT" }, "confidence": 0.66, "cells": [], "children": [] }, { "id": 4, "label": "table", "bbox": { "l": 82.92, "t": 233.78, "r": 239.19, "b": 291.28, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [], "children": [] }, { "id": 19, "label": "picture", "bbox": { "l": 309.79, "t": 253.91, "r": 425.96, "b": 292.39, "coord_origin": "TOPLEFT" }, "confidence": 0.696, "cells": [], "children": [] }, { "id": 37, "label": "table", "bbox": { "l": 309.79, "t": 253.91, "r": 425.96, "b": 292.39, "coord_origin": "TOPLEFT" }, "confidence": 0.528, "cells": [], "children": [] }, { "id": 6, "label": "table", "bbox": { "l": 83.95, "t": 309.05, "r": 239.17, "b": 367.91, "coord_origin": "TOPLEFT" }, "confidence": 0.909, "cells": [], "children": [] }, { "id": 12, "label": "table", "bbox": { "l": 335.27, "t": 388.47, "r": 490.08, "b": 437.02, "coord_origin": "TOPLEFT" }, "confidence": 0.849, "cells": [], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 83.32, "t": 396.01, "r": 248.87, "b": 487.26, "coord_origin": "TOPLEFT" }, "confidence": 0.961, "cells": [], "children": [] }, { "id": 10, "label": "table", "bbox": { "l": 334.93, "t": 453.95, "r": 490.09, "b": 502.72, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [], "children": [] }, { "id": 5, "label": "table", "bbox": { "l": 335.25, "t": 519.08, "r": 490.22, "b": 567.69, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [], "children": [] }, { "id": 13, "label": "picture", "bbox": { "l": 333.96, "t": 593.11, "r": 518.48, "b": 665.49, "coord_origin": "TOPLEFT" }, "confidence": 0.802, "cells": [], "children": [] }, { "id": 30, "label": "table", "bbox": { "l": 333.96, "t": 593.11, "r": 518.48, "b": 665.49, "coord_origin": "TOPLEFT" }, "confidence": 0.593, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": { "17": { "label": "table", "id": 17, "page_no": 12, "cluster": { "id": 17, "label": "table", "bbox": { "l": 310.33, "t": 101.18, "r": 555.83, "b": 136.15, "coord_origin": "TOPLEFT" }, "confidence": 0.705, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "32": { "label": "table", "id": 32, "page_no": 12, "cluster": { "id": 32, "label": "table", "bbox": { "l": 309.96, "t": 154.61, "r": 555.75, "b": 184.72, "coord_origin": "TOPLEFT" }, "confidence": 0.564, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "9": { "label": "table", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "table", "bbox": { "l": 84.03, "t": 156.33, "r": 239.17, "b": 214.39, "coord_origin": "TOPLEFT" }, "confidence": 0.886, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "21": { "label": "table", "id": 21, "page_no": 12, "cluster": { "id": 21, "label": "table", "bbox": { "l": 309.96, "t": 195.71, "r": 555.71, "b": 233.55, "coord_origin": "TOPLEFT" }, "confidence": 0.66, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "4": { "label": "table", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "table", "bbox": { "l": 82.92, "t": 233.78, "r": 239.19, "b": 291.28, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "37": { "label": "table", "id": 37, "page_no": 12, "cluster": { "id": 37, "label": "table", "bbox": { "l": 309.79, "t": 253.91, "r": 425.96, "b": 292.39, "coord_origin": "TOPLEFT" }, "confidence": 0.528, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "6": { "label": "table", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "table", "bbox": { "l": 83.95, "t": 309.05, "r": 239.17, "b": 367.91, "coord_origin": "TOPLEFT" }, "confidence": 0.909, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "12": { "label": "table", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "table", "bbox": { "l": 335.27, "t": 388.47, "r": 490.08, "b": 437.02, "coord_origin": "TOPLEFT" }, "confidence": 0.849, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "0": { "label": "table", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "table", "bbox": { "l": 83.32, "t": 396.01, "r": 248.87, "b": 487.26, "coord_origin": "TOPLEFT" }, "confidence": 0.961, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "10": { "label": "table", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "table", "bbox": { "l": 334.93, "t": 453.95, "r": 490.09, "b": 502.72, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "5": { "label": "table", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "table", "bbox": { "l": 335.25, "t": 519.08, "r": 490.22, "b": 567.69, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "30": { "label": "table", "id": 30, "page_no": 12, "cluster": { "id": 30, "label": "table", "bbox": { "l": 333.96, "t": 593.11, "r": 518.48, "b": 665.49, "coord_origin": "TOPLEFT" }, "confidence": 0.593, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "text", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 88.85, "b": 84.11, "coord_origin": "TOPLEFT" }, "confidence": 0.755, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 88.85, "r_y1": 84.11, "r_x2": 88.85, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "phan cell." }, { "label": "text", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 87.16, "r": 286.36, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.917, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 96.07, "r_x1": 286.36, "r_y1": 96.07, "r_x2": 286.36, "r_y2": 87.16, "r_x3": 62.07, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "9f. Otherwise create a new structural cell and match it", "orig": "9f. Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.02, "r_x1": 127.03, "r_y1": 108.02, "r_x2": 127.03, "r_y2": 99.12, "r_x3": 50.11, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9f. Otherwise create a new structural cell and match it wit the orphan cell." }, { "label": "text", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 111.16, "r": 286.36, "b": 131.71, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 119.75, "r_x1": 286.36, "r_y1": 119.75, "r_x2": 286.36, "r_y2": 111.16, "r_x3": 62.07, "r_y3": 111.16, "coord_origin": "TOPLEFT" }, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.71, "r_x1": 234.06, "r_y1": 131.71, "r_x2": 234.06, "r_y2": 123.12, "r_x3": 50.11, "r_y3": 123.12, "coord_origin": "TOPLEFT" }, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Aditional images with examples of TableFormer predictions and post-processing can be found below." }, { "label": "caption", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "caption", "bbox": { "l": 63.34, "t": 502.06, "r": 273.13, "b": 510.96, "coord_origin": "TOPLEFT" }, "confidence": 0.897, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.34, "r_y0": 510.96, "r_x1": 273.13, "r_y1": 510.96, "r_x2": 273.13, "r_y2": 502.06, "r_x3": 63.34, "r_y3": 502.06, "coord_origin": "TOPLEFT" }, "text": "Figure 8: Example of a table with multi-line header.", "orig": "Figure 8: Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 8: Example of a table with multi-line header." }, { "label": "caption", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "caption", "bbox": { "l": 308.86, "t": 306.6, "r": 545.12, "b": 327.46, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 315.5, "r_x1": 345.63, "r_y1": 315.5, "r_x2": 345.63, "r_y2": 306.6, "r_x3": 308.86, "r_y3": 306.6, "coord_origin": "TOPLEFT" }, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.79, "r_y0": 315.5, "r_x1": 545.12, "r_y1": 315.5, "r_x2": 545.12, "r_y2": 306.6, "r_x3": 352.79, "r_y3": 306.6, "coord_origin": "TOPLEFT" }, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 327.46, "r_x1": 355.9, "r_y1": 327.46, "r_x2": 355.9, "r_y2": 318.55, "r_x3": 308.86, "r_y3": 318.55, "coord_origin": "TOPLEFT" }, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 9: Example of a table with big empty distance between cells." }, { "label": "caption", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 312.34, "t": 680.49, "r": 541.63, "b": 689.4, "coord_origin": "TOPLEFT" }, "confidence": 0.919, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.34, "r_y0": 689.4, "r_x1": 541.63, "r_y1": 689.4, "r_x2": 541.63, "r_y2": 680.49, "r_x3": 312.34, "r_y3": 680.49, "coord_origin": "TOPLEFT" }, "text": "Figure 10: Example of a complex table with empty cells.", "orig": "Figure 10: Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 10: Example of a complex table with empty cells." }, { "label": "page_footer", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.902, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" }, { "label": "table", "id": 17, "page_no": 12, "cluster": { "id": 17, "label": "table", "bbox": { "l": 310.33, "t": 101.18, "r": 555.83, "b": 136.15, "coord_origin": "TOPLEFT" }, "confidence": 0.705, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 32, "page_no": 12, "cluster": { "id": 32, "label": "table", "bbox": { "l": 309.96, "t": 154.61, "r": 555.75, "b": 184.72, "coord_origin": "TOPLEFT" }, "confidence": 0.564, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "table", "bbox": { "l": 84.03, "t": 156.33, "r": 239.17, "b": 214.39, "coord_origin": "TOPLEFT" }, "confidence": 0.886, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 21, "page_no": 12, "cluster": { "id": 21, "label": "table", "bbox": { "l": 309.96, "t": 195.71, "r": 555.71, "b": 233.55, "coord_origin": "TOPLEFT" }, "confidence": 0.66, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "table", "bbox": { "l": 82.92, "t": 233.78, "r": 239.19, "b": 291.28, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 19, "page_no": 12, "cluster": { "id": 19, "label": "picture", "bbox": { "l": 309.79, "t": 253.91, "r": 425.96, "b": 292.39, "coord_origin": "TOPLEFT" }, "confidence": 0.696, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 37, "page_no": 12, "cluster": { "id": 37, "label": "table", "bbox": { "l": 309.79, "t": 253.91, "r": 425.96, "b": 292.39, "coord_origin": "TOPLEFT" }, "confidence": 0.528, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "table", "bbox": { "l": 83.95, "t": 309.05, "r": 239.17, "b": 367.91, "coord_origin": "TOPLEFT" }, "confidence": 0.909, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "table", "bbox": { "l": 335.27, "t": 388.47, "r": 490.08, "b": 437.02, "coord_origin": "TOPLEFT" }, "confidence": 0.849, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "table", "bbox": { "l": 83.32, "t": 396.01, "r": 248.87, "b": 487.26, "coord_origin": "TOPLEFT" }, "confidence": 0.961, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "table", "bbox": { "l": 334.93, "t": 453.95, "r": 490.09, "b": 502.72, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "table", "bbox": { "l": 335.25, "t": 519.08, "r": 490.22, "b": 567.69, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "picture", "bbox": { "l": 333.96, "t": 593.11, "r": 518.48, "b": 665.49, "coord_origin": "TOPLEFT" }, "confidence": 0.802, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 30, "page_no": 12, "cluster": { "id": 30, "label": "table", "bbox": { "l": 333.96, "t": 593.11, "r": 518.48, "b": 665.49, "coord_origin": "TOPLEFT" }, "confidence": 0.593, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } ], "body": [ { "label": "text", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "text", "bbox": { "l": 50.11, "t": 75.21, "r": 88.85, "b": 84.11, "coord_origin": "TOPLEFT" }, "confidence": 0.755, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 84.11, "r_x1": 88.85, "r_y1": 84.11, "r_x2": 88.85, "r_y2": 75.21, "r_x3": 50.11, "r_y3": 75.21, "coord_origin": "TOPLEFT" }, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "phan cell." }, { "label": "text", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "text", "bbox": { "l": 50.11, "t": 87.16, "r": 286.36, "b": 108.02, "coord_origin": "TOPLEFT" }, "confidence": 0.917, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 96.07, "r_x1": 286.36, "r_y1": 96.07, "r_x2": 286.36, "r_y2": 87.16, "r_x3": 62.07, "r_y3": 87.16, "coord_origin": "TOPLEFT" }, "text": "9f. Otherwise create a new structural cell and match it", "orig": "9f. Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 108.02, "r_x1": 127.03, "r_y1": 108.02, "r_x2": 127.03, "r_y2": 99.12, "r_x3": 50.11, "r_y3": 99.12, "coord_origin": "TOPLEFT" }, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9f. Otherwise create a new structural cell and match it wit the orphan cell." }, { "label": "text", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "text", "bbox": { "l": 50.11, "t": 111.16, "r": 286.36, "b": 131.71, "coord_origin": "TOPLEFT" }, "confidence": 0.945, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 62.07, "r_y0": 119.75, "r_x1": 286.36, "r_y1": 119.75, "r_x2": 286.36, "r_y2": 111.16, "r_x3": 62.07, "r_y3": 111.16, "coord_origin": "TOPLEFT" }, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 131.71, "r_x1": 234.06, "r_y1": 131.71, "r_x2": 234.06, "r_y2": 123.12, "r_x3": 50.11, "r_y3": 123.12, "coord_origin": "TOPLEFT" }, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Aditional images with examples of TableFormer predictions and post-processing can be found below." }, { "label": "caption", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "caption", "bbox": { "l": 63.34, "t": 502.06, "r": 273.13, "b": 510.96, "coord_origin": "TOPLEFT" }, "confidence": 0.897, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 63.34, "r_y0": 510.96, "r_x1": 273.13, "r_y1": 510.96, "r_x2": 273.13, "r_y2": 502.06, "r_x3": 63.34, "r_y3": 502.06, "coord_origin": "TOPLEFT" }, "text": "Figure 8: Example of a table with multi-line header.", "orig": "Figure 8: Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 8: Example of a table with multi-line header." }, { "label": "caption", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "caption", "bbox": { "l": 308.86, "t": 306.6, "r": 545.12, "b": 327.46, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 315.5, "r_x1": 345.63, "r_y1": 315.5, "r_x2": 345.63, "r_y2": 306.6, "r_x3": 308.86, "r_y3": 306.6, "coord_origin": "TOPLEFT" }, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 352.79, "r_y0": 315.5, "r_x1": 545.12, "r_y1": 315.5, "r_x2": 545.12, "r_y2": 306.6, "r_x3": 352.79, "r_y3": 306.6, "coord_origin": "TOPLEFT" }, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 327.46, "r_x1": 355.9, "r_y1": 327.46, "r_x2": 355.9, "r_y2": 318.55, "r_x3": 308.86, "r_y3": 318.55, "coord_origin": "TOPLEFT" }, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 9: Example of a table with big empty distance between cells." }, { "label": "caption", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 312.34, "t": 680.49, "r": 541.63, "b": 689.4, "coord_origin": "TOPLEFT" }, "confidence": 0.919, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.34, "r_y0": 689.4, "r_x1": 541.63, "r_y1": 689.4, "r_x2": 541.63, "r_y2": 680.49, "r_x3": 312.34, "r_y3": 680.49, "coord_origin": "TOPLEFT" }, "text": "Figure 10: Example of a complex table with empty cells.", "orig": "Figure 10: Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 10: Example of a complex table with empty cells." }, { "label": "table", "id": 17, "page_no": 12, "cluster": { "id": 17, "label": "table", "bbox": { "l": 310.33, "t": 101.18, "r": 555.83, "b": 136.15, "coord_origin": "TOPLEFT" }, "confidence": 0.705, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 32, "page_no": 12, "cluster": { "id": 32, "label": "table", "bbox": { "l": 309.96, "t": 154.61, "r": 555.75, "b": 184.72, "coord_origin": "TOPLEFT" }, "confidence": 0.564, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "table", "bbox": { "l": 84.03, "t": 156.33, "r": 239.17, "b": 214.39, "coord_origin": "TOPLEFT" }, "confidence": 0.886, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 21, "page_no": 12, "cluster": { "id": 21, "label": "table", "bbox": { "l": 309.96, "t": 195.71, "r": 555.71, "b": 233.55, "coord_origin": "TOPLEFT" }, "confidence": 0.66, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "table", "bbox": { "l": 82.92, "t": 233.78, "r": 239.19, "b": 291.28, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 19, "page_no": 12, "cluster": { "id": 19, "label": "picture", "bbox": { "l": 309.79, "t": 253.91, "r": 425.96, "b": 292.39, "coord_origin": "TOPLEFT" }, "confidence": 0.696, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 37, "page_no": 12, "cluster": { "id": 37, "label": "table", "bbox": { "l": 309.79, "t": 253.91, "r": 425.96, "b": 292.39, "coord_origin": "TOPLEFT" }, "confidence": 0.528, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "table", "bbox": { "l": 83.95, "t": 309.05, "r": 239.17, "b": 367.91, "coord_origin": "TOPLEFT" }, "confidence": 0.909, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "table", "bbox": { "l": 335.27, "t": 388.47, "r": 490.08, "b": 437.02, "coord_origin": "TOPLEFT" }, "confidence": 0.849, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "table", "bbox": { "l": 83.32, "t": 396.01, "r": 248.87, "b": 487.26, "coord_origin": "TOPLEFT" }, "confidence": 0.961, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "table", "bbox": { "l": 334.93, "t": 453.95, "r": 490.09, "b": 502.72, "coord_origin": "TOPLEFT" }, "confidence": 0.882, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "table", "bbox": { "l": 335.25, "t": 519.08, "r": 490.22, "b": 567.69, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "picture", "bbox": { "l": 333.96, "t": 593.11, "r": 518.48, "b": 665.49, "coord_origin": "TOPLEFT" }, "confidence": 0.802, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 30, "page_no": 12, "cluster": { "id": 30, "label": "table", "bbox": { "l": 333.96, "t": 593.11, "r": 518.48, "b": 665.49, "coord_origin": "TOPLEFT" }, "confidence": 0.593, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } ], "headers": [ { "label": "page_footer", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.902, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" } ] } }, { "page_no": 13, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 365.68, "r_x1": 93.05, "r_y1": 365.68, "r_x2": 93.05, "r_y2": 356.77, "r_x3": 50.11, "r_y3": 356.77, "coord_origin": "TOPLEFT" }, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.73, "r_y0": 365.68, "r_x1": 286.37, "r_y1": 365.68, "r_x2": 286.37, "r_y2": 356.77, "r_x3": 103.73, "r_y3": 356.77, "coord_origin": "TOPLEFT" }, "text": "Simple table with different style and empty", "orig": "Simple table with different style and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 377.63, "r_x1": 70.86, "r_y1": 377.63, "r_x2": 70.86, "r_y2": 368.73, "r_x3": 50.11, "r_y3": 368.73, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.62, "r_y0": 680.72, "r_x1": 281.86, "r_y1": 680.72, "r_x2": 281.86, "r_y2": 671.82, "r_x3": 54.62, "r_y3": 671.82, "coord_origin": "TOPLEFT" }, "text": "Figure 12: Simple table predictions and post processing.", "orig": "Figure 12: Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.79, "r_y0": 380.59, "r_x1": 538.19, "r_y1": 380.59, "r_x2": 538.19, "r_y2": 371.68, "r_x3": 315.79, "r_y3": 371.68, "coord_origin": "TOPLEFT" }, "text": "Figure 13: Table predictions example on colorful table.", "orig": "Figure 13: Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 344.98, "r_y0": 692.45, "r_x1": 508.99, "r_y1": 692.45, "r_x2": 508.99, "r_y2": 683.55, "r_x3": 344.98, "r_y3": 683.55, "coord_origin": "TOPLEFT" }, "text": "Figure 14: Example with multi-line text.", "orig": "Figure 14: Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "caption", "bbox": { "l": 50.11, "t": 356.77, "r": 286.37, "b": 377.63, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 365.68, "r_x1": 93.05, "r_y1": 365.68, "r_x2": 93.05, "r_y2": 356.77, "r_x3": 50.11, "r_y3": 356.77, "coord_origin": "TOPLEFT" }, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.73, "r_y0": 365.68, "r_x1": 286.37, "r_y1": 365.68, "r_x2": 286.37, "r_y2": 356.77, "r_x3": 103.73, "r_y3": 356.77, "coord_origin": "TOPLEFT" }, "text": "Simple table with different style and empty", "orig": "Simple table with different style and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 377.63, "r_x1": 70.86, "r_y1": 377.63, "r_x2": 70.86, "r_y2": 368.73, "r_x3": 50.11, "r_y3": 368.73, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "caption", "bbox": { "l": 54.62, "t": 671.82, "r": 281.86, "b": 680.72, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.62, "r_y0": 680.72, "r_x1": 281.86, "r_y1": 680.72, "r_x2": 281.86, "r_y2": 671.82, "r_x3": 54.62, "r_y3": 671.82, "coord_origin": "TOPLEFT" }, "text": "Figure 12: Simple table predictions and post processing.", "orig": "Figure 12: Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "caption", "bbox": { "l": 315.79, "t": 371.68, "r": 538.19, "b": 380.59, "coord_origin": "TOPLEFT" }, "confidence": 0.918, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.79, "r_y0": 380.59, "r_x1": 538.19, "r_y1": 380.59, "r_x2": 538.19, "r_y2": 371.68, "r_x3": 315.79, "r_y3": 371.68, "coord_origin": "TOPLEFT" }, "text": "Figure 13: Table predictions example on colorful table.", "orig": "Figure 13: Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "caption", "bbox": { "l": 344.98, "t": 683.55, "r": 508.99, "b": 692.45, "coord_origin": "TOPLEFT" }, "confidence": 0.919, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 344.98, "r_y0": 692.45, "r_x1": 508.99, "r_y1": 692.45, "r_x2": 508.99, "r_y2": 683.55, "r_x3": 344.98, "r_y3": 683.55, "coord_origin": "TOPLEFT" }, "text": "Figure 14: Example with multi-line text.", "orig": "Figure 14: Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.888, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "picture", "bbox": { "l": 318.63, "t": 90.88, "r": 534.74, "b": 359.06, "coord_origin": "TOPLEFT" }, "confidence": 0.5, "cells": [], "children": [] }, { "id": 30, "label": "picture", "bbox": { "l": 51.15, "t": 104.31, "r": 282.86, "b": 344.91, "coord_origin": "TOPLEFT" }, "confidence": 0.561, "cells": [], "children": [] }, { "id": 23, "label": "table", "bbox": { "l": 318.98, "t": 161.23, "r": 534.62, "b": 214.63, "coord_origin": "TOPLEFT" }, "confidence": 0.624, "cells": [], "children": [] }, { "id": 33, "label": "table", "bbox": { "l": 319.01, "t": 226.11, "r": 534.41, "b": 279.86, "coord_origin": "TOPLEFT" }, "confidence": 0.55, "cells": [], "children": [] }, { "id": 27, "label": "table", "bbox": { "l": 51.73, "t": 273.61, "r": 283.11, "b": 344.24, "coord_origin": "TOPLEFT" }, "confidence": 0.57, "cells": [], "children": [] }, { "id": 38, "label": "table", "bbox": { "l": 328.14, "t": 288.68, "r": 523.89, "b": 358.27, "coord_origin": "TOPLEFT" }, "confidence": 0.523, "cells": [], "children": [] }, { "id": 10, "label": "table", "bbox": { "l": 319.47, "t": 430.9, "r": 518.57, "b": 477.94, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [], "children": [] }, { "id": 9, "label": "table", "bbox": { "l": 51.43, "t": 453.49, "r": 310.73, "b": 491.82, "coord_origin": "TOPLEFT" }, "confidence": 0.842, "cells": [], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 319.98, "t": 489.24, "r": 519.1, "b": 535.7, "coord_origin": "TOPLEFT" }, "confidence": 0.85, "cells": [], "children": [] }, { "id": 4, "label": "table", "bbox": { "l": 50.87, "t": 504.1, "r": 310.61, "b": 542.45, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [], "children": [] }, { "id": 15, "label": "table", "bbox": { "l": 319.83, "t": 546.41, "r": 519.61, "b": 593.11, "coord_origin": "TOPLEFT" }, "confidence": 0.682, "cells": [], "children": [] }, { "id": 6, "label": "table", "bbox": { "l": 51.27, "t": 553.73, "r": 311.09, "b": 591.91, "coord_origin": "TOPLEFT" }, "confidence": 0.887, "cells": [], "children": [] }, { "id": 7, "label": "table", "bbox": { "l": 319.06, "t": 609.84, "r": 533.77, "b": 669.19, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [], "children": [] }, { "id": 11, "label": "picture", "bbox": { "l": 50.4, "t": 611.0, "r": 177.06, "b": 656.16, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": { "23": { "label": "table", "id": 23, "page_no": 13, "cluster": { "id": 23, "label": "table", "bbox": { "l": 318.98, "t": 161.23, "r": 534.62, "b": 214.63, "coord_origin": "TOPLEFT" }, "confidence": 0.624, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "33": { "label": "table", "id": 33, "page_no": 13, "cluster": { "id": 33, "label": "table", "bbox": { "l": 319.01, "t": 226.11, "r": 534.41, "b": 279.86, "coord_origin": "TOPLEFT" }, "confidence": 0.55, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "27": { "label": "table", "id": 27, "page_no": 13, "cluster": { "id": 27, "label": "table", "bbox": { "l": 51.73, "t": 273.61, "r": 283.11, "b": 344.24, "coord_origin": "TOPLEFT" }, "confidence": 0.57, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "38": { "label": "table", "id": 38, "page_no": 13, "cluster": { "id": 38, "label": "table", "bbox": { "l": 328.14, "t": 288.68, "r": 523.89, "b": 358.27, "coord_origin": "TOPLEFT" }, "confidence": 0.523, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "10": { "label": "table", "id": 10, "page_no": 13, "cluster": { "id": 10, "label": "table", "bbox": { "l": 319.47, "t": 430.9, "r": 518.57, "b": 477.94, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "9": { "label": "table", "id": 9, "page_no": 13, "cluster": { "id": 9, "label": "table", "bbox": { "l": 51.43, "t": 453.49, "r": 310.73, "b": 491.82, "coord_origin": "TOPLEFT" }, "confidence": 0.842, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "8": { "label": "table", "id": 8, "page_no": 13, "cluster": { "id": 8, "label": "table", "bbox": { "l": 319.98, "t": 489.24, "r": 519.1, "b": 535.7, "coord_origin": "TOPLEFT" }, "confidence": 0.85, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "4": { "label": "table", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "table", "bbox": { "l": 50.87, "t": 504.1, "r": 310.61, "b": 542.45, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "15": { "label": "table", "id": 15, "page_no": 13, "cluster": { "id": 15, "label": "table", "bbox": { "l": 319.83, "t": 546.41, "r": 519.61, "b": 593.11, "coord_origin": "TOPLEFT" }, "confidence": 0.682, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "6": { "label": "table", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "table", "bbox": { "l": 51.27, "t": 553.73, "r": 311.09, "b": 591.91, "coord_origin": "TOPLEFT" }, "confidence": 0.887, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "7": { "label": "table", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "table", "bbox": { "l": 319.06, "t": 609.84, "r": 533.77, "b": 669.19, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "caption", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 50.11, "t": 356.77, "r": 286.37, "b": 377.63, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 365.68, "r_x1": 93.05, "r_y1": 365.68, "r_x2": 93.05, "r_y2": 356.77, "r_x3": 50.11, "r_y3": 356.77, "coord_origin": "TOPLEFT" }, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.73, "r_y0": 365.68, "r_x1": 286.37, "r_y1": 365.68, "r_x2": 286.37, "r_y2": 356.77, "r_x3": 103.73, "r_y3": 356.77, "coord_origin": "TOPLEFT" }, "text": "Simple table with different style and empty", "orig": "Simple table with different style and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 377.63, "r_x1": 70.86, "r_y1": 377.63, "r_x2": 70.86, "r_y2": 368.73, "r_x3": 50.11, "r_y3": 368.73, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 11: Simple table with different style and empty cells." }, { "label": "caption", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 54.62, "t": 671.82, "r": 281.86, "b": 680.72, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.62, "r_y0": 680.72, "r_x1": 281.86, "r_y1": 680.72, "r_x2": 281.86, "r_y2": 671.82, "r_x3": 54.62, "r_y3": 671.82, "coord_origin": "TOPLEFT" }, "text": "Figure 12: Simple table predictions and post processing.", "orig": "Figure 12: Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 12: Simple table predictions and post processing." }, { "label": "caption", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "caption", "bbox": { "l": 315.79, "t": 371.68, "r": 538.19, "b": 380.59, "coord_origin": "TOPLEFT" }, "confidence": 0.918, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.79, "r_y0": 380.59, "r_x1": 538.19, "r_y1": 380.59, "r_x2": 538.19, "r_y2": 371.68, "r_x3": 315.79, "r_y3": 371.68, "coord_origin": "TOPLEFT" }, "text": "Figure 13: Table predictions example on colorful table.", "orig": "Figure 13: Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 13: Table predictions example on colorful table." }, { "label": "caption", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 344.98, "t": 683.55, "r": 508.99, "b": 692.45, "coord_origin": "TOPLEFT" }, "confidence": 0.919, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 344.98, "r_y0": 692.45, "r_x1": 508.99, "r_y1": 692.45, "r_x2": 508.99, "r_y2": 683.55, "r_x3": 344.98, "r_y3": 683.55, "coord_origin": "TOPLEFT" }, "text": "Figure 14: Example with multi-line text.", "orig": "Figure 14: Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 14: Example with multi-line text." }, { "label": "page_footer", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.888, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" }, { "label": "picture", "id": 41, "page_no": 13, "cluster": { "id": 41, "label": "picture", "bbox": { "l": 318.63, "t": 90.88, "r": 534.74, "b": 359.06, "coord_origin": "TOPLEFT" }, "confidence": 0.5, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 30, "page_no": 13, "cluster": { "id": 30, "label": "picture", "bbox": { "l": 51.15, "t": 104.31, "r": 282.86, "b": 344.91, "coord_origin": "TOPLEFT" }, "confidence": 0.561, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 23, "page_no": 13, "cluster": { "id": 23, "label": "table", "bbox": { "l": 318.98, "t": 161.23, "r": 534.62, "b": 214.63, "coord_origin": "TOPLEFT" }, "confidence": 0.624, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 33, "page_no": 13, "cluster": { "id": 33, "label": "table", "bbox": { "l": 319.01, "t": 226.11, "r": 534.41, "b": 279.86, "coord_origin": "TOPLEFT" }, "confidence": 0.55, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 27, "page_no": 13, "cluster": { "id": 27, "label": "table", "bbox": { "l": 51.73, "t": 273.61, "r": 283.11, "b": 344.24, "coord_origin": "TOPLEFT" }, "confidence": 0.57, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 38, "page_no": 13, "cluster": { "id": 38, "label": "table", "bbox": { "l": 328.14, "t": 288.68, "r": 523.89, "b": 358.27, "coord_origin": "TOPLEFT" }, "confidence": 0.523, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 10, "page_no": 13, "cluster": { "id": 10, "label": "table", "bbox": { "l": 319.47, "t": 430.9, "r": 518.57, "b": 477.94, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 9, "page_no": 13, "cluster": { "id": 9, "label": "table", "bbox": { "l": 51.43, "t": 453.49, "r": 310.73, "b": 491.82, "coord_origin": "TOPLEFT" }, "confidence": 0.842, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 8, "page_no": 13, "cluster": { "id": 8, "label": "table", "bbox": { "l": 319.98, "t": 489.24, "r": 519.1, "b": 535.7, "coord_origin": "TOPLEFT" }, "confidence": 0.85, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "table", "bbox": { "l": 50.87, "t": 504.1, "r": 310.61, "b": 542.45, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 15, "page_no": 13, "cluster": { "id": 15, "label": "table", "bbox": { "l": 319.83, "t": 546.41, "r": 519.61, "b": 593.11, "coord_origin": "TOPLEFT" }, "confidence": 0.682, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "table", "bbox": { "l": 51.27, "t": 553.73, "r": 311.09, "b": 591.91, "coord_origin": "TOPLEFT" }, "confidence": 0.887, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "table", "bbox": { "l": 319.06, "t": 609.84, "r": 533.77, "b": 669.19, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 11, "page_no": 13, "cluster": { "id": 11, "label": "picture", "bbox": { "l": 50.4, "t": 611.0, "r": 177.06, "b": 656.16, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 50.11, "t": 356.77, "r": 286.37, "b": 377.63, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 365.68, "r_x1": 93.05, "r_y1": 365.68, "r_x2": 93.05, "r_y2": 356.77, "r_x3": 50.11, "r_y3": 356.77, "coord_origin": "TOPLEFT" }, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 103.73, "r_y0": 365.68, "r_x1": 286.37, "r_y1": 365.68, "r_x2": 286.37, "r_y2": 356.77, "r_x3": 103.73, "r_y3": 356.77, "coord_origin": "TOPLEFT" }, "text": "Simple table with different style and empty", "orig": "Simple table with different style and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 377.63, "r_x1": 70.86, "r_y1": 377.63, "r_x2": 70.86, "r_y2": 368.73, "r_x3": 50.11, "r_y3": 368.73, "coord_origin": "TOPLEFT" }, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 11: Simple table with different style and empty cells." }, { "label": "caption", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 54.62, "t": 671.82, "r": 281.86, "b": 680.72, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 54.62, "r_y0": 680.72, "r_x1": 281.86, "r_y1": 680.72, "r_x2": 281.86, "r_y2": 671.82, "r_x3": 54.62, "r_y3": 671.82, "coord_origin": "TOPLEFT" }, "text": "Figure 12: Simple table predictions and post processing.", "orig": "Figure 12: Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 12: Simple table predictions and post processing." }, { "label": "caption", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "caption", "bbox": { "l": 315.79, "t": 371.68, "r": 538.19, "b": 380.59, "coord_origin": "TOPLEFT" }, "confidence": 0.918, "cells": [ { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 315.79, "r_y0": 380.59, "r_x1": 538.19, "r_y1": 380.59, "r_x2": 538.19, "r_y2": 371.68, "r_x3": 315.79, "r_y3": 371.68, "coord_origin": "TOPLEFT" }, "text": "Figure 13: Table predictions example on colorful table.", "orig": "Figure 13: Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 13: Table predictions example on colorful table." }, { "label": "caption", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 344.98, "t": 683.55, "r": 508.99, "b": 692.45, "coord_origin": "TOPLEFT" }, "confidence": 0.919, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 344.98, "r_y0": 692.45, "r_x1": 508.99, "r_y1": 692.45, "r_x2": 508.99, "r_y2": 683.55, "r_x3": 344.98, "r_y3": 683.55, "coord_origin": "TOPLEFT" }, "text": "Figure 14: Example with multi-line text.", "orig": "Figure 14: Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 14: Example with multi-line text." }, { "label": "picture", "id": 41, "page_no": 13, "cluster": { "id": 41, "label": "picture", "bbox": { "l": 318.63, "t": 90.88, "r": 534.74, "b": 359.06, "coord_origin": "TOPLEFT" }, "confidence": 0.5, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 30, "page_no": 13, "cluster": { "id": 30, "label": "picture", "bbox": { "l": 51.15, "t": 104.31, "r": 282.86, "b": 344.91, "coord_origin": "TOPLEFT" }, "confidence": 0.561, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 23, "page_no": 13, "cluster": { "id": 23, "label": "table", "bbox": { "l": 318.98, "t": 161.23, "r": 534.62, "b": 214.63, "coord_origin": "TOPLEFT" }, "confidence": 0.624, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 33, "page_no": 13, "cluster": { "id": 33, "label": "table", "bbox": { "l": 319.01, "t": 226.11, "r": 534.41, "b": 279.86, "coord_origin": "TOPLEFT" }, "confidence": 0.55, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 27, "page_no": 13, "cluster": { "id": 27, "label": "table", "bbox": { "l": 51.73, "t": 273.61, "r": 283.11, "b": 344.24, "coord_origin": "TOPLEFT" }, "confidence": 0.57, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 38, "page_no": 13, "cluster": { "id": 38, "label": "table", "bbox": { "l": 328.14, "t": 288.68, "r": 523.89, "b": 358.27, "coord_origin": "TOPLEFT" }, "confidence": 0.523, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 10, "page_no": 13, "cluster": { "id": 10, "label": "table", "bbox": { "l": 319.47, "t": 430.9, "r": 518.57, "b": 477.94, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 9, "page_no": 13, "cluster": { "id": 9, "label": "table", "bbox": { "l": 51.43, "t": 453.49, "r": 310.73, "b": 491.82, "coord_origin": "TOPLEFT" }, "confidence": 0.842, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 8, "page_no": 13, "cluster": { "id": 8, "label": "table", "bbox": { "l": 319.98, "t": 489.24, "r": 519.1, "b": 535.7, "coord_origin": "TOPLEFT" }, "confidence": 0.85, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "table", "bbox": { "l": 50.87, "t": 504.1, "r": 310.61, "b": 542.45, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 15, "page_no": 13, "cluster": { "id": 15, "label": "table", "bbox": { "l": 319.83, "t": 546.41, "r": 519.61, "b": 593.11, "coord_origin": "TOPLEFT" }, "confidence": 0.682, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "table", "bbox": { "l": 51.27, "t": 553.73, "r": 311.09, "b": 591.91, "coord_origin": "TOPLEFT" }, "confidence": 0.887, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "table", "bbox": { "l": 319.06, "t": 609.84, "r": 533.77, "b": 669.19, "coord_origin": "TOPLEFT" }, "confidence": 0.872, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 11, "page_no": 13, "cluster": { "id": 11, "label": "picture", "bbox": { "l": 50.4, "t": 611.0, "r": 177.06, "b": 656.16, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_footer", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.888, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" } ] } }, { "page_no": 14, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 84.23, "r_y0": 653.26, "r_x1": 252.24, "r_y1": 653.26, "r_x2": 252.24, "r_y2": 644.35, "r_x3": 84.23, "r_y3": 644.35, "coord_origin": "TOPLEFT" }, "text": "Figure 15: Example with triangular table.", "orig": "Figure 15: Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 661.84, "r_x1": 545.12, "r_y1": 661.84, "r_x2": 545.12, "r_y2": 652.94, "r_x3": 308.86, "r_y3": 652.94, "coord_origin": "TOPLEFT" }, "text": "Figure 16: Example of how post-processing helps to restore", "orig": "Figure 16: Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 673.8, "r_x1": 497.6, "r_y1": 673.8, "r_x2": 497.6, "r_y2": 664.89, "r_x3": 308.86, "r_y3": 664.89, "coord_origin": "TOPLEFT" }, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "caption", "bbox": { "l": 84.23, "t": 644.35, "r": 252.24, "b": 653.26, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 84.23, "r_y0": 653.26, "r_x1": 252.24, "r_y1": 653.26, "r_x2": 252.24, "r_y2": 644.35, "r_x3": 84.23, "r_y3": 644.35, "coord_origin": "TOPLEFT" }, "text": "Figure 15: Example with triangular table.", "orig": "Figure 15: Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "caption", "bbox": { "l": 308.86, "t": 652.94, "r": 545.12, "b": 673.8, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 661.84, "r_x1": 545.12, "r_y1": 661.84, "r_x2": 545.12, "r_y2": 652.94, "r_x3": 308.86, "r_y3": 652.94, "coord_origin": "TOPLEFT" }, "text": "Figure 16: Example of how post-processing helps to restore", "orig": "Figure 16: Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 673.8, "r_x1": 497.6, "r_y1": 673.8, "r_x2": 497.6, "r_y2": 664.89, "r_x3": 308.86, "r_y3": 664.89, "coord_origin": "TOPLEFT" }, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "table", "bbox": { "l": 323.01, "t": 121.55, "r": 525.95, "b": 222.91, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [], "children": [] }, { "id": 6, "label": "picture", "bbox": { "l": 55.12, "t": 136.26, "r": 279.37, "b": 249.33, "coord_origin": "TOPLEFT" }, "confidence": 0.81, "cells": [], "children": [] }, { "id": 19, "label": "table", "bbox": { "l": 55.12, "t": 136.26, "r": 279.37, "b": 249.33, "coord_origin": "TOPLEFT" }, "confidence": 0.558, "cells": [], "children": [] }, { "id": 2, "label": "table", "bbox": { "l": 323.38, "t": 241.97, "r": 526.13, "b": 344.09, "coord_origin": "TOPLEFT" }, "confidence": 0.906, "cells": [], "children": [] }, { "id": 18, "label": "picture", "bbox": { "l": 54.28, "t": 260.26, "r": 279.26, "b": 373.53, "coord_origin": "TOPLEFT" }, "confidence": 0.567, "cells": [], "children": [] }, { "id": 10, "label": "table", "bbox": { "l": 54.28, "t": 260.26, "r": 279.26, "b": 373.53, "coord_origin": "TOPLEFT" }, "confidence": 0.775, "cells": [], "children": [] }, { "id": 20, "label": "picture", "bbox": { "l": 323.47, "t": 362.45, "r": 525.96, "b": 464.26, "coord_origin": "TOPLEFT" }, "confidence": 0.552, "cells": [], "children": [] }, { "id": 9, "label": "table", "bbox": { "l": 323.47, "t": 362.45, "r": 525.96, "b": 464.26, "coord_origin": "TOPLEFT" }, "confidence": 0.776, "cells": [], "children": [] }, { "id": 5, "label": "picture", "bbox": { "l": 55.42, "t": 384.56, "r": 280.23, "b": 497.56, "coord_origin": "TOPLEFT" }, "confidence": 0.841, "cells": [], "children": [] }, { "id": 22, "label": "picture", "bbox": { "l": 353.69, "t": 487.41, "r": 495.43, "b": 635.77, "coord_origin": "TOPLEFT" }, "confidence": 0.548, "cells": [], "children": [] }, { "id": 8, "label": "table", "bbox": { "l": 353.69, "t": 487.41, "r": 495.43, "b": 635.77, "coord_origin": "TOPLEFT" }, "confidence": 0.781, "cells": [], "children": [] }, { "id": 7, "label": "picture", "bbox": { "l": 50.65, "t": 505.98, "r": 319.91, "b": 631.26, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [], "children": [] }, { "id": 11, "label": "table", "bbox": { "l": 50.65, "t": 505.98, "r": 319.91, "b": 631.26, "coord_origin": "TOPLEFT" }, "confidence": 0.684, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": { "4": { "label": "table", "id": 4, "page_no": 14, "cluster": { "id": 4, "label": "table", "bbox": { "l": 323.01, "t": 121.55, "r": 525.95, "b": 222.91, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "19": { "label": "table", "id": 19, "page_no": 14, "cluster": { "id": 19, "label": "table", "bbox": { "l": 55.12, "t": 136.26, "r": 279.37, "b": 249.33, "coord_origin": "TOPLEFT" }, "confidence": 0.558, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "2": { "label": "table", "id": 2, "page_no": 14, "cluster": { "id": 2, "label": "table", "bbox": { "l": 323.38, "t": 241.97, "r": 526.13, "b": 344.09, "coord_origin": "TOPLEFT" }, "confidence": 0.906, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "10": { "label": "table", "id": 10, "page_no": 14, "cluster": { "id": 10, "label": "table", "bbox": { "l": 54.28, "t": 260.26, "r": 279.26, "b": 373.53, "coord_origin": "TOPLEFT" }, "confidence": 0.775, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "9": { "label": "table", "id": 9, "page_no": 14, "cluster": { "id": 9, "label": "table", "bbox": { "l": 323.47, "t": 362.45, "r": 525.96, "b": 464.26, "coord_origin": "TOPLEFT" }, "confidence": 0.776, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "8": { "label": "table", "id": 8, "page_no": 14, "cluster": { "id": 8, "label": "table", "bbox": { "l": 353.69, "t": 487.41, "r": 495.43, "b": 635.77, "coord_origin": "TOPLEFT" }, "confidence": 0.781, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, "11": { "label": "table", "id": 11, "page_no": 14, "cluster": { "id": 11, "label": "table", "bbox": { "l": 50.65, "t": 505.98, "r": 319.91, "b": 631.26, "coord_origin": "TOPLEFT" }, "confidence": 0.684, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "caption", "id": 0, "page_no": 14, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 84.23, "t": 644.35, "r": 252.24, "b": 653.26, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 84.23, "r_y0": 653.26, "r_x1": 252.24, "r_y1": 653.26, "r_x2": 252.24, "r_y2": 644.35, "r_x3": 84.23, "r_y3": 644.35, "coord_origin": "TOPLEFT" }, "text": "Figure 15: Example with triangular table.", "orig": "Figure 15: Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 15: Example with triangular table." }, { "label": "caption", "id": 1, "page_no": 14, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 308.86, "t": 652.94, "r": 545.12, "b": 673.8, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 661.84, "r_x1": 545.12, "r_y1": 661.84, "r_x2": 545.12, "r_y2": 652.94, "r_x3": 308.86, "r_y3": 652.94, "coord_origin": "TOPLEFT" }, "text": "Figure 16: Example of how post-processing helps to restore", "orig": "Figure 16: Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 673.8, "r_x1": 497.6, "r_y1": 673.8, "r_x2": 497.6, "r_y2": 664.89, "r_x3": 308.86, "r_y3": 664.89, "coord_origin": "TOPLEFT" }, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact." }, { "label": "page_footer", "id": 3, "page_no": 14, "cluster": { "id": 3, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15" }, { "label": "table", "id": 4, "page_no": 14, "cluster": { "id": 4, "label": "table", "bbox": { "l": 323.01, "t": 121.55, "r": 525.95, "b": 222.91, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 6, "page_no": 14, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 55.12, "t": 136.26, "r": 279.37, "b": 249.33, "coord_origin": "TOPLEFT" }, "confidence": 0.81, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 19, "page_no": 14, "cluster": { "id": 19, "label": "table", "bbox": { "l": 55.12, "t": 136.26, "r": 279.37, "b": 249.33, "coord_origin": "TOPLEFT" }, "confidence": 0.558, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 2, "page_no": 14, "cluster": { "id": 2, "label": "table", "bbox": { "l": 323.38, "t": 241.97, "r": 526.13, "b": 344.09, "coord_origin": "TOPLEFT" }, "confidence": 0.906, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 18, "page_no": 14, "cluster": { "id": 18, "label": "picture", "bbox": { "l": 54.28, "t": 260.26, "r": 279.26, "b": 373.53, "coord_origin": "TOPLEFT" }, "confidence": 0.567, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 10, "page_no": 14, "cluster": { "id": 10, "label": "table", "bbox": { "l": 54.28, "t": 260.26, "r": 279.26, "b": 373.53, "coord_origin": "TOPLEFT" }, "confidence": 0.775, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 20, "page_no": 14, "cluster": { "id": 20, "label": "picture", "bbox": { "l": 323.47, "t": 362.45, "r": 525.96, "b": 464.26, "coord_origin": "TOPLEFT" }, "confidence": 0.552, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 9, "page_no": 14, "cluster": { "id": 9, "label": "table", "bbox": { "l": 323.47, "t": 362.45, "r": 525.96, "b": 464.26, "coord_origin": "TOPLEFT" }, "confidence": 0.776, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 5, "page_no": 14, "cluster": { "id": 5, "label": "picture", "bbox": { "l": 55.42, "t": 384.56, "r": 280.23, "b": 497.56, "coord_origin": "TOPLEFT" }, "confidence": 0.841, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 22, "page_no": 14, "cluster": { "id": 22, "label": "picture", "bbox": { "l": 353.69, "t": 487.41, "r": 495.43, "b": 635.77, "coord_origin": "TOPLEFT" }, "confidence": 0.548, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 8, "page_no": 14, "cluster": { "id": 8, "label": "table", "bbox": { "l": 353.69, "t": 487.41, "r": 495.43, "b": 635.77, "coord_origin": "TOPLEFT" }, "confidence": 0.781, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 7, "page_no": 14, "cluster": { "id": 7, "label": "picture", "bbox": { "l": 50.65, "t": 505.98, "r": 319.91, "b": 631.26, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 11, "page_no": 14, "cluster": { "id": 11, "label": "table", "bbox": { "l": 50.65, "t": 505.98, "r": 319.91, "b": 631.26, "coord_origin": "TOPLEFT" }, "confidence": 0.684, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } ], "body": [ { "label": "caption", "id": 0, "page_no": 14, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 84.23, "t": 644.35, "r": 252.24, "b": 653.26, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 84.23, "r_y0": 653.26, "r_x1": 252.24, "r_y1": 653.26, "r_x2": 252.24, "r_y2": 644.35, "r_x3": 84.23, "r_y3": 644.35, "coord_origin": "TOPLEFT" }, "text": "Figure 15: Example with triangular table.", "orig": "Figure 15: Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 15: Example with triangular table." }, { "label": "caption", "id": 1, "page_no": 14, "cluster": { "id": 1, "label": "caption", "bbox": { "l": 308.86, "t": 652.94, "r": 545.12, "b": 673.8, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 661.84, "r_x1": 545.12, "r_y1": 661.84, "r_x2": 545.12, "r_y2": 652.94, "r_x3": 308.86, "r_y3": 652.94, "coord_origin": "TOPLEFT" }, "text": "Figure 16: Example of how post-processing helps to restore", "orig": "Figure 16: Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 308.86, "r_y0": 673.8, "r_x1": 497.6, "r_y1": 673.8, "r_x2": 497.6, "r_y2": 664.89, "r_x3": 308.86, "r_y3": 664.89, "coord_origin": "TOPLEFT" }, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact." }, { "label": "table", "id": 4, "page_no": 14, "cluster": { "id": 4, "label": "table", "bbox": { "l": 323.01, "t": 121.55, "r": 525.95, "b": 222.91, "coord_origin": "TOPLEFT" }, "confidence": 0.857, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 6, "page_no": 14, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 55.12, "t": 136.26, "r": 279.37, "b": 249.33, "coord_origin": "TOPLEFT" }, "confidence": 0.81, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 19, "page_no": 14, "cluster": { "id": 19, "label": "table", "bbox": { "l": 55.12, "t": 136.26, "r": 279.37, "b": 249.33, "coord_origin": "TOPLEFT" }, "confidence": 0.558, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "table", "id": 2, "page_no": 14, "cluster": { "id": 2, "label": "table", "bbox": { "l": 323.38, "t": 241.97, "r": 526.13, "b": 344.09, "coord_origin": "TOPLEFT" }, "confidence": 0.906, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 18, "page_no": 14, "cluster": { "id": 18, "label": "picture", "bbox": { "l": 54.28, "t": 260.26, "r": 279.26, "b": 373.53, "coord_origin": "TOPLEFT" }, "confidence": 0.567, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 10, "page_no": 14, "cluster": { "id": 10, "label": "table", "bbox": { "l": 54.28, "t": 260.26, "r": 279.26, "b": 373.53, "coord_origin": "TOPLEFT" }, "confidence": 0.775, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 20, "page_no": 14, "cluster": { "id": 20, "label": "picture", "bbox": { "l": 323.47, "t": 362.45, "r": 525.96, "b": 464.26, "coord_origin": "TOPLEFT" }, "confidence": 0.552, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 9, "page_no": 14, "cluster": { "id": 9, "label": "table", "bbox": { "l": 323.47, "t": 362.45, "r": 525.96, "b": 464.26, "coord_origin": "TOPLEFT" }, "confidence": 0.776, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 5, "page_no": 14, "cluster": { "id": 5, "label": "picture", "bbox": { "l": 55.42, "t": 384.56, "r": 280.23, "b": 497.56, "coord_origin": "TOPLEFT" }, "confidence": 0.841, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "picture", "id": 22, "page_no": 14, "cluster": { "id": 22, "label": "picture", "bbox": { "l": 353.69, "t": 487.41, "r": 495.43, "b": 635.77, "coord_origin": "TOPLEFT" }, "confidence": 0.548, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 8, "page_no": 14, "cluster": { "id": 8, "label": "table", "bbox": { "l": 353.69, "t": 487.41, "r": 495.43, "b": 635.77, "coord_origin": "TOPLEFT" }, "confidence": 0.781, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] }, { "label": "picture", "id": 7, "page_no": 14, "cluster": { "id": 7, "label": "picture", "bbox": { "l": 50.65, "t": 505.98, "r": 319.91, "b": 631.26, "coord_origin": "TOPLEFT" }, "confidence": 0.806, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "table", "id": 11, "page_no": 14, "cluster": { "id": 11, "label": "table", "bbox": { "l": 50.65, "t": 505.98, "r": 319.91, "b": 631.26, "coord_origin": "TOPLEFT" }, "confidence": 0.684, "cells": [], "children": [] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 0, "num_cols": 0, "table_cells": [] } ], "headers": [ { "label": "page_footer", "id": 3, "page_no": 14, "cluster": { "id": 3, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15" } ] } }, { "page_no": 15, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 517.24, "r_x1": 545.11, "r_y1": 517.24, "r_x2": 545.11, "r_y2": 508.34, "r_x3": 50.11, "r_y3": 508.34, "coord_origin": "TOPLEFT" }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 529.2, "r_x1": 173.24, "r_y1": 529.2, "r_x2": 173.24, "r_y2": 520.29, "r_x3": 50.11, "r_y3": 520.29, "coord_origin": "TOPLEFT" }, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "caption", "bbox": { "l": 50.11, "t": 508.34, "r": 545.11, "b": 529.2, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 517.24, "r_x1": 545.11, "r_y1": 517.24, "r_x2": 545.11, "r_y2": 508.34, "r_x3": 50.11, "r_y3": 508.34, "coord_origin": "TOPLEFT" }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 529.2, "r_x1": 173.24, "r_y1": 529.2, "r_x2": 173.24, "r_y2": 520.29, "r_x3": 50.11, "r_y3": 520.29, "coord_origin": "TOPLEFT" }, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "picture", "bbox": { "l": 66.8, "t": 253.62, "r": 528.56, "b": 498.14, "coord_origin": "TOPLEFT" }, "confidence": 0.691, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "caption", "id": 0, "page_no": 15, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 50.11, "t": 508.34, "r": 545.11, "b": 529.2, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 517.24, "r_x1": 545.11, "r_y1": 517.24, "r_x2": 545.11, "r_y2": 508.34, "r_x3": 50.11, "r_y3": 508.34, "coord_origin": "TOPLEFT" }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 529.2, "r_x1": 173.24, "r_y1": 529.2, "r_x2": 173.24, "r_y2": 520.29, "r_x3": 50.11, "r_y3": 520.29, "coord_origin": "TOPLEFT" }, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure." }, { "label": "page_footer", "id": 1, "page_no": 15, "cluster": { "id": 1, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16" }, { "label": "picture", "id": 2, "page_no": 15, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 66.8, "t": 253.62, "r": 528.56, "b": 498.14, "coord_origin": "TOPLEFT" }, "confidence": 0.691, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 0, "page_no": 15, "cluster": { "id": 0, "label": "caption", "bbox": { "l": 50.11, "t": 508.34, "r": 545.11, "b": 529.2, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 517.24, "r_x1": 545.11, "r_y1": 517.24, "r_x2": 545.11, "r_y2": 508.34, "r_x3": 50.11, "r_y3": 508.34, "coord_origin": "TOPLEFT" }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 50.11, "r_y0": 529.2, "r_x1": 173.24, "r_y1": 529.2, "r_x2": 173.24, "r_y2": 520.29, "r_x3": 50.11, "r_y3": 520.29, "coord_origin": "TOPLEFT" }, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure." }, { "label": "picture", "id": 2, "page_no": 15, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 66.8, "t": 253.62, "r": 528.56, "b": 498.14, "coord_origin": "TOPLEFT" }, "confidence": 0.691, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_footer", "id": 1, "page_no": 15, "cluster": { "id": 1, "label": "page_footer", "bbox": { "l": 292.63, "t": 734.13, "r": 302.59, "b": 743.04, "coord_origin": "TOPLEFT" }, "confidence": 0.913, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.63, "r_y0": 743.04, "r_x1": 302.59, "r_y1": 743.04, "r_x2": 302.59, "r_y2": 734.13, "r_x3": 292.63, "r_y3": 734.13, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16" } ] } } ]